Repository: dellhpc/omnia Branch: main Commit: 483ce3abf010 Files: 1073 Total size: 5.3 MB Directory structure: gitextract_fe371nzs/ ├── .all-contributorsrc ├── .ansible-lint ├── .config/ │ ├── ansible-lint.yml │ └── requirements.yml ├── .gitattributes ├── .github/ │ ├── ISSUE_TEMPLATE/ │ │ ├── bug_report.md │ │ ├── feature_request.md │ │ └── logo_community.md │ ├── branch-switcher.yml │ ├── pull_request_template.md │ ├── stale.yml │ └── workflows/ │ ├── ansible-lint.yml │ └── pylint.yml ├── .gitignore ├── .metadata/ │ └── omnia_version ├── .readthedocs.yaml ├── CODE_OF_CONDUCT.md ├── CONTRIBUTING.md ├── LICENSE ├── README.md ├── SECURITY.md ├── ansible.cfg ├── build_image_aarch64/ │ ├── ansible.cfg │ ├── build_image_aarch64.yml │ └── roles/ │ ├── fetch_packages/ │ │ ├── tasks/ │ │ │ ├── aarch64_build_image_completion.yml │ │ │ ├── build_stream_prerequisite.yml │ │ │ ├── check_aarch64_fg.yml │ │ │ ├── fetch_packages.yml │ │ │ ├── fetch_pulp_repos.yml │ │ │ └── main.yml │ │ └── vars/ │ │ └── main.yml │ ├── image_creation/ │ │ ├── tasks/ │ │ │ ├── build_base_image.yml │ │ │ ├── build_compute_image.yml │ │ │ └── main.yml │ │ ├── templates/ │ │ │ ├── base_image_template.j2 │ │ │ └── compute_images_templates.j2 │ │ └── vars/ │ │ └── main.yml │ └── prepare_arm_node/ │ ├── tasks/ │ │ ├── gather_oim_data.yml │ │ └── main.yml │ └── vars/ │ └── main.yml ├── build_image_x86_64/ │ ├── ansible.cfg │ ├── build_image_x86_64.yml │ └── roles/ │ ├── fetch_packages/ │ │ ├── tasks/ │ │ │ ├── build_stream_prerequisite.yml │ │ │ ├── check_x86_64_fg.yml │ │ │ ├── fetch_packages.yml │ │ │ ├── fetch_pulp_repos.yml │ │ │ ├── main.yml │ │ │ └── x86_64_build_image_completion.yml │ │ └── vars/ │ │ └── main.yml │ └── image_creation/ │ ├── tasks/ │ │ ├── build_base_image.yml │ │ ├── build_compute_image.yml │ │ ├── main.yml │ │ └── prepare_pulp_image.yml │ ├── templates/ │ │ ├── base_image_template.j2 │ │ └── compute_images_templates.j2 │ └── vars/ │ └── main.yml ├── build_stream/ │ ├── .gitignore │ ├── README.md │ ├── __init__.py │ ├── api/ │ │ ├── __init__.py │ │ ├── auth/ │ │ │ ├── __init__.py │ │ │ ├── jwt_handler.py │ │ │ ├── password_handler.py │ │ │ ├── routes.py │ │ │ ├── schemas.py │ │ │ └── service.py │ │ ├── build_image/ │ │ │ ├── __init__.py │ │ │ ├── dependencies.py │ │ │ ├── routes.py │ │ │ └── schemas.py │ │ ├── catalog_roles/ │ │ │ ├── __init__.py │ │ │ ├── dependencies.py │ │ │ ├── routes.py │ │ │ ├── schemas.py │ │ │ └── service.py │ │ ├── dependencies.py │ │ ├── generate_input_files/ │ │ │ ├── __init__.py │ │ │ ├── dependencies.py │ │ │ ├── routes.py │ │ │ └── schemas.py │ │ ├── jobs/ │ │ │ ├── __init__.py │ │ │ ├── dependencies.py │ │ │ ├── routes.py │ │ │ └── schemas.py │ │ ├── local_repo/ │ │ │ ├── __init__.py │ │ │ ├── dependencies.py │ │ │ ├── routes.py │ │ │ └── schemas.py │ │ ├── logging_utils.py │ │ ├── parse_catalog/ │ │ │ ├── __init__.py │ │ │ ├── dependencies.py │ │ │ ├── routes.py │ │ │ ├── schemas.py │ │ │ └── service.py │ │ ├── router.py │ │ ├── validate/ │ │ │ ├── __init__.py │ │ │ ├── dependencies.py │ │ │ ├── routes.py │ │ │ └── schemas.py │ │ └── vault_client.py │ ├── build_stream.ini │ ├── common/ │ │ ├── __init__.py │ │ ├── config.py │ │ ├── constants.py │ │ ├── logging.py │ │ └── user_messages.py │ ├── container.py │ ├── core/ │ │ ├── __init__.py │ │ ├── artifacts/ │ │ │ ├── __init__.py │ │ │ ├── entities.py │ │ │ ├── exceptions.py │ │ │ ├── interfaces.py │ │ │ ├── ports.py │ │ │ └── value_objects.py │ │ ├── build/ │ │ │ └── __init__.py │ │ ├── build_image/ │ │ │ ├── __init__.py │ 
│ │ ├── entities.py │ │ │ ├── exceptions.py │ │ │ ├── repositories.py │ │ │ ├── services.py │ │ │ └── value_objects.py │ │ ├── catalog/ │ │ │ ├── ADAPTER_POLICY_GUIDE.md │ │ │ ├── README.md │ │ │ ├── __init__.py │ │ │ ├── adapter.py │ │ │ ├── adapter_policy.py │ │ │ ├── adapter_policy_schema_consts.py │ │ │ ├── exceptions.py │ │ │ ├── generator.py │ │ │ ├── models.py │ │ │ ├── parser.py │ │ │ ├── resources/ │ │ │ │ ├── AdapterPolicySchema.json │ │ │ │ ├── CatalogSchema.json │ │ │ │ ├── RootLevelSchema.json │ │ │ │ └── adapter_policy_default.json │ │ │ ├── test_fixtures/ │ │ │ │ ├── adapter_policy_test.json │ │ │ │ ├── catalog_rhel.json │ │ │ │ └── functional_layer.json │ │ │ ├── tests/ │ │ │ │ ├── sample.py │ │ │ │ ├── test_adapter_cli_defaults.py │ │ │ │ ├── test_adapter_policy.py │ │ │ │ ├── test_generator_cli_defaults.py │ │ │ │ ├── test_generator_package_list.py │ │ │ │ ├── test_generator_roles.py │ │ │ │ └── test_parser_defaults.py │ │ │ └── utils.py │ │ ├── common/ │ │ │ └── __init__.py │ │ ├── exceptions.py │ │ ├── jobs/ │ │ │ ├── __init__.py │ │ │ ├── entities/ │ │ │ │ ├── __init__.py │ │ │ │ ├── audit.py │ │ │ │ ├── idempotency.py │ │ │ │ ├── job.py │ │ │ │ └── stage.py │ │ │ ├── exceptions.py │ │ │ ├── repositories.py │ │ │ ├── services.py │ │ │ └── value_objects.py │ │ ├── localrepo/ │ │ │ ├── __init__.py │ │ │ ├── entities.py │ │ │ ├── exceptions.py │ │ │ ├── repositories.py │ │ │ ├── services.py │ │ │ └── value_objects.py │ │ ├── utils/ │ │ │ └── __init__.py │ │ └── validate/ │ │ ├── __init__.py │ │ ├── entities.py │ │ ├── exceptions.py │ │ └── services.py │ ├── doc/ │ │ ├── README.md │ │ ├── __init__.py │ │ ├── build_image.md │ │ ├── catalog.md │ │ ├── jobs.md │ │ ├── local_repo.md │ │ └── validation.md │ ├── generate_catalog.py │ ├── generate_catalog_examples.py │ ├── infra/ │ │ ├── __init__.py │ │ ├── artifact_store/ │ │ │ ├── __init__.py │ │ │ ├── file_artifact_store.py │ │ │ ├── in_memory_artifact_metadata.py │ │ │ └── in_memory_artifact_store.py │ │ ├── db/ │ │ │ ├── __init__.py │ │ │ ├── alembic/ │ │ │ │ ├── env.py │ │ │ │ ├── script.py.mako │ │ │ │ └── versions/ │ │ │ │ ├── 20260219_001_create_jobs_table.py │ │ │ │ ├── 20260219_002_create_stages_table.py │ │ │ │ ├── 20260219_003_create_idempotency_keys_table.py │ │ │ │ ├── 20260219_004_create_audit_events_table.py │ │ │ │ └── 20260219_005_create_artifact_metadata_table.py │ │ │ ├── alembic.ini │ │ │ ├── config.py │ │ │ ├── mappers.py │ │ │ ├── models.py │ │ │ ├── repositories.py │ │ │ └── session.py │ │ ├── id_generator.py │ │ └── repositories/ │ │ ├── __init__.py │ │ ├── in_memory.py │ │ ├── nfs_build_image_inventory_repository.py │ │ ├── nfs_input_repository.py │ │ ├── nfs_playbook_queue_request_repository.py │ │ └── nfs_playbook_queue_result_repository.py │ ├── main.py │ ├── orchestrator/ │ │ ├── __init__.py │ │ ├── build_image/ │ │ │ ├── __init__.py │ │ │ ├── commands/ │ │ │ │ ├── __init__.py │ │ │ │ └── create_build_image.py │ │ │ ├── dtos/ │ │ │ │ ├── __init__.py │ │ │ │ └── build_image_response.py │ │ │ └── use_cases/ │ │ │ ├── __init__.py │ │ │ └── create_build_image.py │ │ ├── catalog/ │ │ │ ├── commands/ │ │ │ │ ├── generate_input_files.py │ │ │ │ └── parse_catalog.py │ │ │ ├── dtos.py │ │ │ └── use_cases/ │ │ │ ├── __init__.py │ │ │ ├── generate_input_files.py │ │ │ └── parse_catalog.py │ │ ├── common/ │ │ │ ├── __init__.py │ │ │ └── result_poller.py │ │ ├── jobs/ │ │ │ ├── __init__.py │ │ │ ├── commands/ │ │ │ │ ├── __init__.py │ │ │ │ └── create_job.py │ │ │ ├── dtos/ │ │ │ │ ├── __init__.py │ │ │ │ └── 
job_response.py │ │ │ └── use_cases/ │ │ │ ├── __init__.py │ │ │ └── create_job.py │ │ ├── local_repo/ │ │ │ ├── __init__.py │ │ │ ├── commands/ │ │ │ │ ├── __init__.py │ │ │ │ └── create_local_repo.py │ │ │ ├── dtos/ │ │ │ │ ├── __init__.py │ │ │ │ └── local_repo_response.py │ │ │ ├── result_poller.py │ │ │ └── use_cases/ │ │ │ ├── __init__.py │ │ │ └── create_local_repo.py │ │ └── validate/ │ │ ├── __init__.py │ │ ├── commands/ │ │ │ ├── __init__.py │ │ │ └── validate_image_on_test.py │ │ ├── dtos/ │ │ │ ├── __init__.py │ │ │ └── validate_image_on_test_response.py │ │ └── use_cases/ │ │ ├── __init__.py │ │ └── validate_image_on_test.py │ ├── playbook-watcher/ │ │ └── playbook_watcher_service.py │ ├── pytest.ini │ ├── requirements-dev.txt │ ├── requirements.txt │ ├── scripts/ │ │ └── generate_jwt_keys.sh │ ├── tests/ │ │ ├── README.md │ │ ├── __init__.py │ │ ├── conftest.py │ │ ├── demo/ │ │ │ └── buildstream_demo.py │ │ ├── end_to_end/ │ │ │ └── api/ │ │ │ ├── conftest.py │ │ │ ├── test_api_flow_e2e.py │ │ │ ├── test_build_image_e2e.py │ │ │ ├── test_generate_input_files_e2e.py │ │ │ ├── test_parse_catalog_e2e.py │ │ │ ├── test_register_e2e.py │ │ │ └── test_token_e2e.py │ │ ├── integration/ │ │ │ ├── api/ │ │ │ │ ├── auth/ │ │ │ │ │ ├── conftest.py │ │ │ │ │ ├── test_register.py │ │ │ │ │ └── test_token.py │ │ │ │ ├── build_image/ │ │ │ │ │ ├── __init__.py │ │ │ │ │ ├── conftest.py │ │ │ │ │ └── test_build_image_api.py │ │ │ │ ├── catalog_roles/ │ │ │ │ │ ├── __init__.py │ │ │ │ │ ├── conftest.py │ │ │ │ │ └── test_catalog_roles_api.py │ │ │ │ ├── conftest.py │ │ │ │ ├── generate_input_files/ │ │ │ │ │ ├── conftest.py │ │ │ │ │ ├── test_generate_input_files_api.py │ │ │ │ │ ├── test_generate_input_files_artifact_integration.py │ │ │ │ │ └── test_generate_input_files_routes.py │ │ │ │ ├── jobs/ │ │ │ │ │ ├── conftest.py │ │ │ │ │ ├── test_create_job_api.py │ │ │ │ │ ├── test_delete_job_api.py │ │ │ │ │ └── test_get_job_api.py │ │ │ │ ├── local_repo/ │ │ │ │ │ ├── __init__.py │ │ │ │ │ ├── conftest.py │ │ │ │ │ ├── test_create_local_repo_api.py │ │ │ │ │ └── test_create_local_repo_edge_cases.py │ │ │ │ ├── parse_catalog/ │ │ │ │ │ ├── conftest.py │ │ │ │ │ ├── test_parse_catalog_api.py │ │ │ │ │ ├── test_parse_catalog_artifact_integration.py │ │ │ │ │ └── test_parse_catalog_routes.py │ │ │ │ └── validate/ │ │ │ │ ├── __init__.py │ │ │ │ ├── conftest.py │ │ │ │ ├── test_models.py │ │ │ │ └── test_validate_image_on_test_api.py │ │ │ ├── conftest.py │ │ │ ├── core/ │ │ │ │ └── catalog/ │ │ │ │ ├── test_adapter_cli_defaults.py │ │ │ │ ├── test_adapter_policy.py │ │ │ │ ├── test_generator_cli_defaults.py │ │ │ │ ├── test_generator_package_list.py │ │ │ │ └── test_generator_roles.py │ │ │ └── infra/ │ │ │ ├── artifact_store/ │ │ │ │ └── test_file_artifact_store.py │ │ │ └── db/ │ │ │ ├── conftest.py │ │ │ └── test_sql_repositories.py │ │ ├── mocks/ │ │ │ ├── __init__.py │ │ │ ├── mock_jwt_handler.py │ │ │ └── mock_vault_client.py │ │ ├── others/ │ │ │ ├── __init__.py │ │ │ └── test_dependency_rules.py │ │ ├── performance/ │ │ │ └── test_local_repo_performance.py │ │ ├── unit/ │ │ │ ├── __init__.py │ │ │ ├── api/ │ │ │ │ ├── auth/ │ │ │ │ │ ├── test_password_handler.py │ │ │ │ │ ├── test_service.py │ │ │ │ │ └── test_token_service.py │ │ │ │ ├── build_image/ │ │ │ │ │ ├── __init__.py │ │ │ │ │ └── test_routes.py │ │ │ │ ├── catalog_roles/ │ │ │ │ │ ├── __init__.py │ │ │ │ │ └── test_catalog_roles_service.py │ │ │ │ ├── jobs/ │ │ │ │ │ ├── test_dependencies.py │ │ │ │ │ └── test_schemas.py │ │ │ 
│ ├── local_repo/ │ │ │ │ │ ├── test_local_repo_dependencies.py │ │ │ │ │ ├── test_local_repo_schemas.py │ │ │ │ │ └── test_routes.py │ │ │ │ └── validate/ │ │ │ │ ├── __init__.py │ │ │ │ └── test_routes.py │ │ │ ├── core/ │ │ │ │ ├── __init__.py │ │ │ │ ├── artifacts/ │ │ │ │ │ ├── __init__.py │ │ │ │ │ ├── conftest.py │ │ │ │ │ ├── test_exceptions.py │ │ │ │ │ └── test_value_objects.py │ │ │ │ ├── build_image/ │ │ │ │ │ ├── __init__.py │ │ │ │ │ ├── test_entities.py │ │ │ │ │ ├── test_services.py │ │ │ │ │ └── test_value_objects.py │ │ │ │ ├── catalog/ │ │ │ │ │ ├── test_exceptions.py │ │ │ │ │ ├── test_generate_software_config.py │ │ │ │ │ ├── test_parser.py │ │ │ │ │ └── test_parser_defaults.py │ │ │ │ ├── jobs/ │ │ │ │ │ ├── __init__.py │ │ │ │ │ ├── entities/ │ │ │ │ │ │ ├── __init__.py │ │ │ │ │ │ ├── conftest.py │ │ │ │ │ │ ├── test_audit.py │ │ │ │ │ │ ├── test_idempotency.py │ │ │ │ │ │ ├── test_job.py │ │ │ │ │ │ └── test_stage.py │ │ │ │ │ ├── test_exceptions.py │ │ │ │ │ └── test_value_objects.py │ │ │ │ ├── localrepo/ │ │ │ │ │ ├── __init__.py │ │ │ │ │ ├── test_entities.py │ │ │ │ │ ├── test_exceptions.py │ │ │ │ │ ├── test_services.py │ │ │ │ │ └── test_value_objects.py │ │ │ │ └── validate/ │ │ │ │ ├── __init__.py │ │ │ │ ├── test_entities.py │ │ │ │ ├── test_exceptions.py │ │ │ │ └── test_services.py │ │ │ ├── infra/ │ │ │ │ ├── __init__.py │ │ │ │ ├── artifact_store/ │ │ │ │ │ ├── __init__.py │ │ │ │ │ ├── conftest.py │ │ │ │ │ ├── test_in_memory_artifact_metadata.py │ │ │ │ │ └── test_in_memory_artifact_store.py │ │ │ │ ├── db/ │ │ │ │ │ ├── test_mappers.py │ │ │ │ │ └── test_repositories_unit.py │ │ │ │ ├── test_id_generator.py │ │ │ │ ├── test_nfs_input_directory_repository.py │ │ │ │ ├── test_nfs_playbook_queue_result_service.py │ │ │ │ └── test_nfs_repositories.py │ │ │ └── orchestrator/ │ │ │ ├── __init__.py │ │ │ ├── build_image/ │ │ │ │ ├── __init__.py │ │ │ │ └── test_create_build_image_use_case.py │ │ │ ├── catalog/ │ │ │ │ ├── conftest.py │ │ │ │ ├── test_generate_input_files_command.py │ │ │ │ ├── test_generate_input_files_use_case.py │ │ │ │ ├── test_parse_catalog_command.py │ │ │ │ └── test_parse_catalog_use_case.py │ │ │ ├── common/ │ │ │ │ ├── __init__.py │ │ │ │ └── test_result_poller.py │ │ │ ├── jobs/ │ │ │ │ ├── __init__.py │ │ │ │ └── use_cases/ │ │ │ │ ├── __init__.py │ │ │ │ ├── conftest.py │ │ │ │ └── test_create_job.py │ │ │ ├── local_repo/ │ │ │ │ ├── __init__.py │ │ │ │ ├── test_commands.py │ │ │ │ ├── test_dtos.py │ │ │ │ ├── test_result_poller.py │ │ │ │ └── test_use_case.py │ │ │ └── validate/ │ │ │ ├── __init__.py │ │ │ └── test_validate_image_on_test_use_case.py │ │ └── utils/ │ │ ├── __init__.py │ │ └── test_data.py │ └── utils/ │ └── __init__.py ├── common/ │ ├── library/ │ │ ├── module_utils/ │ │ │ ├── build_image/ │ │ │ │ ├── __init__.py │ │ │ │ ├── common_functions.py │ │ │ │ └── config.py │ │ │ ├── discovery/ │ │ │ │ ├── __init__.py │ │ │ │ └── standard_functions.py │ │ │ ├── input_validation/ │ │ │ │ ├── __init__.py │ │ │ │ ├── common_utils/ │ │ │ │ │ ├── __init__.py │ │ │ │ │ ├── config.py │ │ │ │ │ ├── data_fetch.py │ │ │ │ │ ├── data_validation.py │ │ │ │ │ ├── data_verification.py │ │ │ │ │ ├── en_us_validation_msg.py │ │ │ │ │ ├── logical_validation.py │ │ │ │ │ ├── slurm_conf_utils.py │ │ │ │ │ ├── timezone.txt │ │ │ │ │ └── validation_utils.py │ │ │ │ ├── schema/ │ │ │ │ │ ├── __init__.py │ │ │ │ │ ├── additional_software.json │ │ │ │ │ ├── build_stream_config.json │ │ │ │ │ ├── credential_rules.json │ │ │ │ │ ├── 
functional_groups_config.json │ │ │ │ │ ├── gitlab_config.json │ │ │ │ │ ├── high_availability_config.json │ │ │ │ │ ├── k8s_scheduler.json │ │ │ │ │ ├── local_repo_config.json │ │ │ │ │ ├── network_spec.json │ │ │ │ │ ├── omnia_config.json │ │ │ │ │ ├── provision_config.json │ │ │ │ │ ├── security_config.json │ │ │ │ │ ├── slurm_config_parameters.json │ │ │ │ │ ├── software_config.json │ │ │ │ │ ├── storage_config.json │ │ │ │ │ └── telemetry_config.json │ │ │ │ └── validation_flows/ │ │ │ │ ├── __init__.py │ │ │ │ ├── build_stream_validation.py │ │ │ │ ├── common_validation.py │ │ │ │ ├── csi_driver_validation.py │ │ │ │ ├── gitlab_validation.py │ │ │ │ ├── high_availability_validation.py │ │ │ │ ├── local_repo_validation.py │ │ │ │ ├── provision_validation.py │ │ │ │ └── scheduler_validation.py │ │ │ └── local_repo/ │ │ │ ├── __init__.py │ │ │ ├── common_functions.py │ │ │ ├── config.py │ │ │ ├── container_repo_utils.py │ │ │ ├── download_common.py │ │ │ ├── download_image.py │ │ │ ├── download_rpm.py │ │ │ ├── parse_and_download.py │ │ │ ├── process_metadata.py │ │ │ ├── process_parallel.py │ │ │ ├── registry_utils.py │ │ │ ├── rest_client.py │ │ │ ├── software_utils.py │ │ │ ├── standard_logger.py │ │ │ ├── user_image_utility.py │ │ │ └── validate_utils.py │ │ └── modules/ │ │ ├── additional_images_collector.py │ │ ├── base_image_package_collector.py │ │ ├── cert_vault_handler.py │ │ ├── check_user_registry.py │ │ ├── delete_idracips_from_mysqldb.py │ │ ├── disable_idrac_telemetry.py │ │ ├── enable_telemetry_service.py │ │ ├── fetch_credential_rule.py │ │ ├── fetch_idrac_ips.py │ │ ├── fetch_mapping_details.py │ │ ├── fetch_roles_config.py │ │ ├── fetch_software_arch.py │ │ ├── fetch_telemetry_status.py │ │ ├── functional_group_parser.py │ │ ├── generate_argon2_password.py │ │ ├── generate_functional_groups.py │ │ ├── generate_ssha_password.py │ │ ├── generate_xname_in_mapping_file.py │ │ ├── get_service_cluster_info.py │ │ ├── group_package_map.py │ │ ├── idrac_telemetry_filter.py │ │ ├── image_package_collector.py │ │ ├── insert_idracips_mysqldb.py │ │ ├── localrepo_metadata_manager.py │ │ ├── parallel_file_copy.py │ │ ├── parallel_tasks.py │ │ ├── prepare_tasklist.py │ │ ├── process_rpm_config.py │ │ ├── pulp_cleanup.py │ │ ├── read_idracips_from_mysqldb.py │ │ ├── slurm_conf.py │ │ ├── update_bmc_group_entry.py │ │ ├── validate_bmc_group_data.py │ │ ├── validate_credentials.py │ │ ├── validate_input.py │ │ └── validate_user_repo.py │ ├── tasks/ │ │ ├── common/ │ │ │ ├── decrypt_include_encrypt.yml │ │ │ ├── get_container_image_list.yml │ │ │ ├── openchami_auth.yml │ │ │ └── validate_image_tars.yml │ │ ├── provision/ │ │ │ └── main.yml │ │ ├── scheduler/ │ │ │ └── main.yml │ │ └── telemetry/ │ │ └── main.yml │ └── vars/ │ ├── common_messages.yml │ ├── common_vars.yml │ ├── encrypt_files_vars.yml │ ├── image_vars.yml │ ├── openchami_image_cmd.yml │ ├── openchami_vars.yml │ ├── provision_messages.yml │ ├── provision_vars.yml │ ├── scheduler_messages.yml │ ├── scheduler_vars.yml │ ├── telemetry_messages.yml │ └── telemetry_vars.yml ├── discovery/ │ ├── ansible.cfg │ ├── discovery.yml │ └── roles/ │ ├── README.md │ ├── configure_ochami/ │ │ ├── README.md │ │ ├── tasks/ │ │ │ ├── configure_bss_cloud_init.yml │ │ │ ├── configure_bss_group.yml │ │ │ ├── configure_cloud_init_common.yml │ │ │ ├── configure_cloud_init_group.yml │ │ │ ├── create_groups.yml │ │ │ ├── create_groups_common.yml │ │ │ ├── delete_smd_config.yml │ │ │ ├── discover_mapping_nodes.yml │ │ │ ├── discovery_completion.yml 
│ │ │ ├── fetch_additional_images.yml │ │ │ ├── main.yml │ │ │ └── update_smd_groups.yaml │ │ ├── templates/ │ │ │ ├── bss/ │ │ │ │ └── bss.yaml.j2 │ │ │ ├── cloud_init/ │ │ │ │ ├── ci-defaults.yaml.j2 │ │ │ │ ├── ci-group-common.yaml.j2 │ │ │ │ ├── ci-group-default_x86_64.yaml.j2 │ │ │ │ ├── ci-group-login_compiler_node_aarch64.yaml.j2 │ │ │ │ ├── ci-group-login_compiler_node_x86_64.yaml.j2 │ │ │ │ ├── ci-group-login_node_aarch64.yaml.j2 │ │ │ │ ├── ci-group-login_node_x86_64.yaml.j2 │ │ │ │ ├── ci-group-service_kube_control_plane_first_x86_64.yaml.j2 │ │ │ │ ├── ci-group-service_kube_control_plane_x86_64.yaml.j2 │ │ │ │ ├── ci-group-service_kube_node_x86_64.yaml.j2 │ │ │ │ ├── ci-group-slurm_control_node_x86_64.yaml.j2 │ │ │ │ ├── ci-group-slurm_node_aarch64.yaml.j2 │ │ │ │ └── ci-group-slurm_node_x86_64.yaml.j2 │ │ │ ├── doca-ofed/ │ │ │ │ ├── configure-ib-network.sh.j2 │ │ │ │ └── doca-install.sh.j2 │ │ │ ├── hpc_tools/ │ │ │ │ ├── configure_nvhpc_env.sh.j2 │ │ │ │ ├── configure_ucx_openmpi_env.sh.j2 │ │ │ │ ├── export_nvhpc_env.sh.j2 │ │ │ │ ├── install_nvhpc_sdk.sh.j2 │ │ │ │ ├── install_openmpi.sh.j2 │ │ │ │ ├── install_ucx.sh.j2 │ │ │ │ └── setup_nvhpc_sdk.sh.j2 │ │ │ ├── ldms/ │ │ │ │ └── ldms_sampler.sh.j2 │ │ │ ├── nodes/ │ │ │ │ ├── apptainer_mirror.conf.j2 │ │ │ │ ├── bmc_group_data.csv.j2 │ │ │ │ ├── groups.yaml.j2 │ │ │ │ ├── groups_common.yaml.j2 │ │ │ │ ├── hostname.yaml.j2 │ │ │ │ └── nodes.yaml.j2 │ │ │ ├── openldap/ │ │ │ │ ├── sssd.conf.j2 │ │ │ │ └── update_ldap_conf.sh.j2 │ │ │ ├── pull_additional_images.yaml.j2 │ │ │ ├── slurm/ │ │ │ │ └── check_slurm_controller_status.sh.j2 │ │ │ └── telemetry/ │ │ │ └── telemetry.sh.j2 │ │ └── vars/ │ │ └── main.yml │ ├── discovery_validations/ │ │ ├── README.md │ │ ├── tasks/ │ │ │ ├── build_stream_prerequisite.yml │ │ │ ├── include_inputs.yml │ │ │ ├── include_software_config.yml │ │ │ ├── main.yml │ │ │ ├── update_hosts.yml │ │ │ ├── validate_image.yml │ │ │ ├── validate_mapping_file.yml │ │ │ ├── validate_mapping_mechanism.yml │ │ │ ├── validate_oim_timezone.yml │ │ │ ├── validate_openldap_container.yml │ │ │ └── validate_telemetry_config.yml │ │ └── vars/ │ │ └── main.yml │ ├── k8s_config/ │ │ ├── README.md │ │ ├── files/ │ │ │ └── empty_certificate_template.yml │ │ ├── tasks/ │ │ │ ├── create_k8s_config_nfs.yml │ │ │ ├── create_node_dir.yml │ │ │ ├── get_powerscale_dependencies.yml │ │ │ └── main.yml │ │ ├── templates/ │ │ │ └── ps_storage_class.j2 │ │ └── vars/ │ │ └── main.yml │ ├── nfs_client/ │ │ ├── README.md │ │ ├── tasks/ │ │ │ ├── main.yml │ │ │ └── nfs_client.yml │ │ └── vars/ │ │ └── main.yml │ ├── openldap/ │ │ ├── README.md │ │ ├── tasks/ │ │ │ └── main.yml │ │ └── vars/ │ │ └── main.yml │ ├── passwordless_ssh/ │ │ ├── tasks/ │ │ │ ├── build_host_lists.yml │ │ │ ├── configure_oim_ssh.yml │ │ │ ├── main.yml │ │ │ └── read_nodes_yaml.yml │ │ └── vars/ │ │ └── main.yml │ ├── slurm_config/ │ │ ├── README.md │ │ ├── defaults/ │ │ │ └── main.yml │ │ ├── tasks/ │ │ │ ├── backup_conf.yml │ │ │ ├── build_slurm_conf.yml │ │ │ ├── check_ctld_running.yml │ │ │ ├── confs.yml │ │ │ ├── create_slurm_dir.yml │ │ │ ├── detect_busy_nodes.yml │ │ │ ├── drain_and_remove_node.yml │ │ │ ├── exist_dir.yml │ │ │ ├── extract_path_overrides.yml │ │ │ ├── handle_extra_confs.yml │ │ │ ├── hpc_tools.yml │ │ │ ├── main.yml │ │ │ ├── openldap_config.yml │ │ │ ├── read_node_homogeneous.yml │ │ │ ├── read_node_idrac.yml │ │ │ ├── read_node_idrac_group.yml │ │ │ ├── read_slurm_hostnames.yml │ │ │ ├── remove_node.yml │ │ │ ├── storage.yml │ │ │ 
├── update_hosts_munge.yml │ │ │ └── validate_path_overrides.yml │ │ ├── templates/ │ │ │ ├── all_other.conf.j2 │ │ │ ├── container_image.list.j2 │ │ │ ├── download_container_image.sh.j2 │ │ │ ├── logout_user.sh.j2 │ │ │ └── mariadb-server.cnf.j2 │ │ └── vars/ │ │ └── main.yml │ └── telemetry/ │ ├── README.md │ ├── files/ │ │ └── nersc-ldms-aggr/ │ │ ├── .gitignore │ │ ├── Makefile │ │ ├── README.md │ │ ├── health_check.bash │ │ ├── host_map.slurm-cluster.json │ │ ├── make_host_map.bash │ │ ├── make_host_map.dell.py │ │ ├── manifest.yaml.in │ │ ├── mkmanifest.py │ │ ├── nersc-ldms-aggr/ │ │ │ ├── Chart.yaml │ │ │ └── templates/ │ │ │ ├── NetworkAttachmentDefinition.yaml │ │ │ ├── Service.nersc-ldms-agg.yaml │ │ │ ├── Service.nersc-ldms-store.yaml │ │ │ ├── Statefulset.nersc-ldms-agg.yaml │ │ │ └── Statefulset.nersc-ldms-store.yaml │ │ ├── nersc_ldms_make_ldms_config.py │ │ └── scripts/ │ │ ├── decomp.json │ │ ├── kafka.conf │ │ ├── ldms_ls.bash │ │ ├── ldms_msg_publish.py │ │ ├── ldms_msg_subscribe.py │ │ ├── ldms_stats.bash │ │ ├── ldmsd.bash │ │ ├── ldmsd_stream.bash │ │ └── start_munge.bash │ ├── tasks/ │ │ ├── apply_telemetry_on_upgrade.yml │ │ ├── check_pxe_changes.yml │ │ ├── generate_service_cluster_metadata.yml │ │ ├── generate_telemetry_deployments.yml │ │ ├── load_service_images.yml │ │ ├── main.yml │ │ ├── read_software_config.yml │ │ ├── restart_ldms_configs.yml │ │ ├── telemetry_prereq.yml │ │ ├── update_ldms_agg_config.yml │ │ ├── update_ldms_sampler.yml │ │ └── validate_idrac_inventory.yml │ ├── templates/ │ │ └── telemetry/ │ │ ├── cleanup_telemetry.sh.j2 │ │ ├── common/ │ │ │ ├── telemetry_cleaner_rbac.yaml.j2 │ │ │ ├── telemetry_namespace_creation.yaml.j2 │ │ │ ├── telemetry_pod_cleanup.yaml.j2 │ │ │ └── telemetry_secret_creation.yaml.j2 │ │ ├── idrac_telemetry/ │ │ │ └── idrac_telemetry_statefulset.yaml.j2 │ │ ├── kafka/ │ │ │ ├── kafka.kafka.yaml.j2 │ │ │ ├── kafka.kafka_bridge.yaml.j2 │ │ │ ├── kafka.kafka_bridge_lb.yaml.j2 │ │ │ ├── kafka.kafkapump_user.yaml.j2 │ │ │ ├── kafka.tls_test_job.yaml.j2 │ │ │ └── kafka.topic.yaml.j2 │ │ ├── kustomization.yaml.j2 │ │ ├── ldms/ │ │ │ ├── host_map.slurm-cluster.json.j2 │ │ │ ├── ldms_machine_config.json.j2 │ │ │ ├── ldmsauth.conf.j2 │ │ │ ├── ldmsd.sampler.env.j2 │ │ │ ├── sampler.conf.j2 │ │ │ └── values.yaml.j2 │ │ └── victoria/ │ │ ├── gen_victoria_certs.sh.j2 │ │ ├── victoria-agent-deployment.yaml.j2 │ │ ├── victoria-cluster-vminsert.yaml.j2 │ │ ├── victoria-cluster-vmselect.yaml.j2 │ │ ├── victoria-cluster-vmstorage.yaml.j2 │ │ ├── victoria-statefulset.yaml.j2 │ │ ├── victoria-tls-secret.yaml.j2 │ │ ├── victoria-tls-test-job.yaml.j2 │ │ ├── victoria-vmagent-rbac.yaml.j2 │ │ └── vmagent-scrape-config.yaml.j2 │ └── vars/ │ └── main.yml ├── docs/ │ └── README.rst ├── examples/ │ ├── catalog/ │ │ ├── catalog_rhel.json │ │ ├── catalog_rhel_aarch64_with_slurm_only.json │ │ ├── catalog_rhel_with_ucx_openmpi.json │ │ ├── catalog_rhel_x86_64_with_slurm_only.json │ │ └── mapping_file_software_config/ │ │ ├── catalog_rhel_aarch64_with_slurm_only_json/ │ │ │ ├── pxe_mapping_file.csv │ │ │ └── software_config.json │ │ ├── catalog_rhel_json/ │ │ │ ├── pxe_mapping_file.csv │ │ │ └── software_config.json │ │ ├── catalog_rhel_with_ucx_openmpi_json/ │ │ │ ├── pxe_mapping_file.csv │ │ │ └── software_config.json │ │ └── catalog_rhel_x86_64_with_slurm_only_json/ │ │ ├── pxe_mapping_file.csv │ │ └── software_config.json │ ├── input_template/ │ │ └── bare_metal_slurm/ │ │ ├── aarch64/ │ │ │ ├── with_service_k8s/ │ │ │ │ ├── 
only_login_compiler_node/ │ │ │ │ │ ├── high_availability_config.yml │ │ │ │ │ ├── local_repo_config.yml │ │ │ │ │ ├── network_spec.yml │ │ │ │ │ ├── omnia_config.yml │ │ │ │ │ ├── provision_config.yml │ │ │ │ │ ├── security_config.yml │ │ │ │ │ ├── software_config.json │ │ │ │ │ ├── storage_config.yml │ │ │ │ │ ├── telemetry_config.yml │ │ │ │ │ └── user_registry_credential.yml │ │ │ │ └── only_login_node/ │ │ │ │ ├── high_availability_config.yml │ │ │ │ ├── local_repo_config.yml │ │ │ │ ├── network_spec.yml │ │ │ │ ├── omnia_config.yml │ │ │ │ ├── provision_config.yml │ │ │ │ ├── security_config.yml │ │ │ │ ├── software_config.json │ │ │ │ ├── storage_config.yml │ │ │ │ ├── telemetry_config.yml │ │ │ │ └── user_registry_credential.yml │ │ │ └── without_service_k8s/ │ │ │ ├── only_login_compiler_node/ │ │ │ │ ├── high_availability_config.yml │ │ │ │ ├── local_repo_config.yml │ │ │ │ ├── network_spec.yml │ │ │ │ ├── omnia_config.yml │ │ │ │ ├── provision_config.yml │ │ │ │ ├── security_config.yml │ │ │ │ ├── software_config.json │ │ │ │ ├── storage_config.yml │ │ │ │ ├── telemetry_config.yml │ │ │ │ └── user_registry_credential.yml │ │ │ └── only_login_node/ │ │ │ ├── high_availability_config.yml │ │ │ ├── local_repo_config.yml │ │ │ ├── network_spec.yml │ │ │ ├── omnia_config.yml │ │ │ ├── provision_config.yml │ │ │ ├── security_config.yml │ │ │ ├── software_config.json │ │ │ ├── storage_config.yml │ │ │ ├── telemetry_config.yml │ │ │ └── user_registry_credential.yml │ │ └── x86_64/ │ │ ├── with_service_k8s/ │ │ │ ├── only_login_compiler_node/ │ │ │ │ ├── high_availability_config.yml │ │ │ │ ├── local_repo_config.yml │ │ │ │ ├── network_spec.yml │ │ │ │ ├── omnia_config.yml │ │ │ │ ├── provision_config.yml │ │ │ │ ├── security_config.yml │ │ │ │ ├── software_config.json │ │ │ │ ├── storage_config.yml │ │ │ │ ├── telemetry_config.yml │ │ │ │ └── user_registry_credential.yml │ │ │ └── only_login_node/ │ │ │ ├── high_availability_config.yml │ │ │ ├── local_repo_config.yml │ │ │ ├── network_spec.yml │ │ │ ├── omnia_config.yml │ │ │ ├── provision_config.yml │ │ │ ├── security_config.yml │ │ │ ├── software_config.json │ │ │ ├── storage_config.yml │ │ │ ├── telemetry_config.yml │ │ │ └── user_registry_credential.yml │ │ └── without_service_k8s/ │ │ ├── only_login_compiler_node/ │ │ │ ├── high_availability_config.yml │ │ │ ├── local_repo_config.yml │ │ │ ├── network_spec.yml │ │ │ ├── omnia_config.yml │ │ │ ├── provision_config.yml │ │ │ ├── security_config.yml │ │ │ ├── software_config.json │ │ │ ├── storage_config.yml │ │ │ ├── telemetry_config.yml │ │ │ └── user_registry_credential.yml │ │ └── only_login_node/ │ │ ├── high_availability_config.yml │ │ ├── local_repo_config.yml │ │ ├── network_spec.yml │ │ ├── omnia_config.yml │ │ ├── provision_config.yml │ │ ├── security_config.yml │ │ ├── software_config.json │ │ ├── storage_config.yml │ │ ├── telemetry_config.yml │ │ └── user_registry_credential.yml │ ├── inventory/ │ │ └── bmc_inventory_file │ ├── pxe_mapping_file.csv │ ├── rhel_software_config.json │ ├── slurm_conf/ │ │ ├── cgroup.conf │ │ ├── slurm.conf │ │ └── slurmdbd.conf │ └── software_config_template/ │ ├── template_rhel_10.0_multi_arch_software_config.json │ └── template_rhel_10.0_x86-64_software_config.json ├── gitlab/ │ ├── ansible.cfg │ ├── cleanup_gitlab.yml │ ├── gitlab.yml │ └── roles/ │ ├── cleanup_gitlab/ │ │ ├── tasks/ │ │ │ ├── cleanup_buildstream_oauth.yml │ │ │ ├── cleanup_cicd.yml │ │ │ ├── cleanup_credentials.yml │ │ │ ├── cleanup_directories.yml │ │ │ ├── 
cleanup_packages.yml │ │ │ ├── cleanup_runner.yml │ │ │ ├── cleanup_services.yml │ │ │ ├── cleanup_summary.yml │ │ │ ├── cleanup_tls.yml │ │ │ └── main.yml │ │ └── vars/ │ │ └── main.yml │ ├── gitlab_passwordless_ssh/ │ │ ├── files/ │ │ │ └── check_gitlab_port.sh │ │ ├── tasks/ │ │ │ ├── authorize_key.yml │ │ │ ├── generate_keypair.yml │ │ │ ├── main.yml │ │ │ ├── prereq_checks.yml │ │ │ └── validate_ssh.yml │ │ └── vars/ │ │ └── main.yml │ └── hosted_gitlab/ │ ├── files/ │ │ └── .gitlab-ci.yml │ ├── tasks/ │ │ ├── check_oim_prerequisites.yml │ │ ├── configure_firewall.yml │ │ ├── configure_gitlab.yml │ │ ├── create_directories.yml │ │ ├── create_project.yml │ │ ├── create_trigger.yml │ │ ├── deploy_runner.yml │ │ ├── display_summary.yml │ │ ├── generate_tls_certs.yml │ │ ├── install_gitlab.yml │ │ ├── install_packages.yml │ │ ├── main.yml │ │ ├── podman_login.yml │ │ ├── prereq_checks.yml │ │ ├── push_ci_files.yml │ │ ├── root_password_change.yml │ │ ├── set_pipeline_variables.yml │ │ └── validate_prerequisites.yml │ ├── templates/ │ │ ├── gitlab.rb.j2 │ │ ├── gitlab_runner.container.j2 │ │ └── san.cnf.j2 │ └── vars/ │ └── main.yml ├── input/ │ ├── build_stream_config.yml │ ├── config/ │ │ ├── aarch64/ │ │ │ └── rhel/ │ │ │ └── 10.0/ │ │ │ ├── additional_packages.json │ │ │ ├── admin_debug_packages.json │ │ │ ├── default_packages.json │ │ │ ├── ldms.json │ │ │ ├── openldap.json │ │ │ ├── openmpi.json │ │ │ ├── slurm_custom.json │ │ │ └── ucx.json │ │ └── x86_64/ │ │ └── rhel/ │ │ └── 10.0/ │ │ ├── additional_packages.json │ │ ├── admin_debug_packages.json │ │ ├── csi_driver_powerscale.json │ │ ├── default_packages.json │ │ ├── ldms.json │ │ ├── openldap.json │ │ ├── openmpi.json │ │ ├── service_k8s.json │ │ ├── slurm_custom.json │ │ └── ucx.json │ ├── gitlab_config.yml │ ├── high_availability_config.yml │ ├── local_repo_config.yml │ ├── network_spec.yml │ ├── omnia_config.yml │ ├── provision_config.yml │ ├── pxe_mapping_file.csv │ ├── security_config.yml │ ├── software_config.json │ ├── storage_config.yml │ ├── telemetry_config.yml │ └── user_registry_credential.yml ├── input_validation/ │ ├── ansible.cfg │ ├── roles/ │ │ ├── validate_input/ │ │ │ ├── tasks/ │ │ │ │ └── main.yml │ │ │ └── vars/ │ │ │ └── main.yml │ │ └── validate_subscription/ │ │ ├── tasks/ │ │ │ ├── check_rhel_subscription.yml │ │ │ └── configure_rhel_os_urls.yml │ │ └── vars/ │ │ └── main.yml │ └── validate_config.yml ├── local_repo/ │ ├── ansible.cfg │ ├── local_repo.yml │ ├── pulp_cleanup.yml │ └── roles/ │ ├── parse_and_download/ │ │ ├── tasks/ │ │ │ ├── arch_component_loop.yml │ │ │ ├── create_metadata.yml │ │ │ ├── execute_parallel_tasks.yml │ │ │ ├── localrepo_completion.yml │ │ │ ├── main.yml │ │ │ └── process_rpm_repo.yml │ │ ├── templates/ │ │ │ └── local_repo_access.yml.j2 │ │ └── vars/ │ │ └── main.yml │ ├── pulp_validation/ │ │ ├── tasks/ │ │ │ ├── check_pulp_status.yml │ │ │ ├── main.yml │ │ │ └── read_network_spec.yml │ │ └── vars/ │ │ └── main.yml │ └── validation/ │ ├── tasks/ │ │ ├── check_additional_packages_images.yml │ │ ├── check_images_per_arch.yml │ │ ├── display_msg.yml │ │ ├── main.yml │ │ ├── prerequisites.yml │ │ ├── validate_metadata.yml │ │ └── validate_software_config_json.yml │ └── vars/ │ └── main.yml ├── omnia.sh ├── prepare_oim/ │ ├── ansible.cfg │ ├── prepare_oim.yml │ └── roles/ │ ├── deploy_containers/ │ │ ├── auth/ │ │ │ ├── files/ │ │ │ │ ├── bootstrap.ldif │ │ │ │ └── slapd.conf │ │ │ ├── tasks/ │ │ │ │ ├── configure_bootstrap_ldif.yml │ │ │ │ ├── configure_slapd_conf.yml │ │ │ │ 
├── deploy_auth_service.yml │ │ │ │ ├── generate_ldap_password_hashes.yml │ │ │ │ ├── include_security_config.yml │ │ │ │ └── main.yml │ │ │ ├── templates/ │ │ │ │ └── auth.j2 │ │ │ └── vars/ │ │ │ └── main.yml │ │ ├── build_stream/ │ │ │ ├── handlers/ │ │ │ │ └── main.yml │ │ │ ├── tasks/ │ │ │ │ ├── deploy_build_stream.yml │ │ │ │ ├── enable_watcher_service.yml │ │ │ │ └── main.yml │ │ │ ├── templates/ │ │ │ │ ├── build_stream.j2 │ │ │ │ └── playbook_watcher.service.j2 │ │ │ └── vars/ │ │ │ └── main.yml │ │ ├── common/ │ │ │ ├── tasks/ │ │ │ │ ├── aarch64_prereq.yml │ │ │ │ ├── add_known_hosts.yml │ │ │ │ ├── configure_chrony.yml │ │ │ │ ├── firewall_settings.yml │ │ │ │ ├── main.yml │ │ │ │ ├── omnia_service.yml │ │ │ │ ├── package_installation.yml │ │ │ │ ├── podman_login.yml │ │ │ │ └── prepare_oim_completion.yml │ │ │ ├── templates/ │ │ │ │ ├── bmc_group_data.j2 │ │ │ │ └── omnia.service.j2 │ │ │ └── vars/ │ │ │ └── main.yml │ │ ├── openchami/ │ │ │ ├── tasks/ │ │ │ │ ├── deploy_openchami.yml │ │ │ │ ├── deployment_prereq.yml │ │ │ │ ├── main.yml │ │ │ │ └── verify_openchami.yml │ │ │ ├── templates/ │ │ │ │ ├── configs.yaml.j2 │ │ │ │ └── inventory.yaml.j2 │ │ │ └── vars/ │ │ │ └── main.yml │ │ ├── postgres/ │ │ │ ├── tasks/ │ │ │ │ ├── deploy_postgres.yml │ │ │ │ └── main.yml │ │ │ ├── templates/ │ │ │ │ ├── init_build_stream_db.sql.j2 │ │ │ │ └── postgres.j2 │ │ │ └── vars/ │ │ │ └── main.yml │ │ └── pulp/ │ │ ├── tasks/ │ │ │ ├── create_pulp_config_http.yml │ │ │ ├── create_pulp_config_https.yml │ │ │ ├── deploy_pulp_container_http.yml │ │ │ ├── deploy_pulp_container_https.yml │ │ │ ├── deployment_prereq.yml │ │ │ ├── main.yml │ │ │ └── reload_pulp_nginx.yml │ │ ├── templates/ │ │ │ ├── http_quadlet.j2 │ │ │ ├── https_quadlet.j2 │ │ │ ├── nginx_conf.j2 │ │ │ └── settings_template.j2 │ │ └── vars/ │ │ └── main.yml │ └── prepare_oim_validation/ │ ├── tasks/ │ │ ├── check_k8s_support.yml │ │ ├── check_openldap_support.yml │ │ ├── include_local_repo_config.yml │ │ ├── main.yml │ │ ├── pre_requisite.yml │ │ ├── validate_network_spec.yml │ │ └── validate_passwordless_ssh_oim.yml │ └── vars/ │ └── main.yml ├── telemetry/ │ ├── ansible.cfg │ ├── roles/ │ │ ├── idrac_telemetry/ │ │ │ ├── tasks/ │ │ │ │ ├── create_telemetry_report.yml │ │ │ │ ├── initiate_telemetry_service_cluster.yml │ │ │ │ ├── main.yml │ │ │ │ ├── remove_deleted_nodes.yml │ │ │ │ ├── trigger_telemetry_collection.yml │ │ │ │ └── validate_bmcips_reachability.yml │ │ │ ├── templates/ │ │ │ │ └── telemetry_report.j2 │ │ │ └── vars/ │ │ │ └── main.yml │ │ ├── service_k8s_telemetry/ │ │ │ ├── tasks/ │ │ │ │ ├── main.yml │ │ │ │ └── update_metadata_file.yml │ │ │ └── vars/ │ │ │ └── main.yml │ │ └── telemetry_validation/ │ │ ├── files/ │ │ │ └── timezone.txt │ │ ├── tasks/ │ │ │ ├── main.yml │ │ │ ├── validate_idrac_inventory.yml │ │ │ ├── validate_telemetry_config.yml │ │ │ └── validation_status_check.yml │ │ └── vars/ │ │ └── main.yml │ └── telemetry.yml ├── upgrade/ │ ├── ansible.cfg │ ├── main.yml │ ├── roles/ │ │ ├── import_input_parameters/ │ │ │ ├── tasks/ │ │ │ │ ├── display_warnings.yml │ │ │ │ ├── main.yml │ │ │ │ ├── precheck_backup_location.yml │ │ │ │ ├── restore_input_files.yml │ │ │ │ ├── restore_omnia_config_credentials.yml │ │ │ │ ├── restore_single_input_file.yml │ │ │ │ ├── restore_user_registry_credential.yml │ │ │ │ ├── set_backup_location.yml │ │ │ │ ├── transform_high_availability_config.yml │ │ │ │ ├── transform_local_repo_config.yml │ │ │ │ ├── transform_network_spec.yml │ │ │ │ ├── 
transform_omnia_config.yml │ │ │ │ ├── transform_provision_config.yml │ │ │ │ ├── transform_storage_config.yml │ │ │ │ └── transform_telemetry_config.yml │ │ │ ├── templates/ │ │ │ │ ├── high_availability_config.j2 │ │ │ │ ├── local_repo_config.j2 │ │ │ │ ├── network_spec.j2 │ │ │ │ ├── omnia_config.j2 │ │ │ │ ├── omnia_config_credentials.yml.j2 │ │ │ │ ├── provision_config.j2 │ │ │ │ ├── storage_config.j2 │ │ │ │ └── telemetry_config.j2 │ │ │ └── vars/ │ │ │ └── main.yml │ │ ├── upgrade_cluster/ │ │ │ ├── tasks/ │ │ │ │ └── main.yml │ │ │ └── vars/ │ │ │ └── main.yml │ │ └── upgrade_oim/ │ │ ├── tasks/ │ │ │ └── main.yml │ │ └── vars/ │ │ └── main.yml │ ├── rollback_omnia.yml │ ├── upgrade_cluster.yml │ ├── upgrade_oim.yml │ └── upgrade_omnia.yml └── utils/ ├── ansible.cfg ├── create_container_group.yml ├── credential_utility/ │ ├── ansible.cfg │ ├── get_config_credentials.yml │ └── roles/ │ ├── create_config/ │ │ ├── tasks/ │ │ │ ├── create_credential_file.yml │ │ │ └── main.yml │ │ ├── templates/ │ │ │ ├── build_stream_credential.j2 │ │ │ └── omnia_credential.j2 │ │ └── vars/ │ │ └── main.yml │ ├── update_config/ │ │ ├── tasks/ │ │ │ ├── credential_status.yml │ │ │ ├── fetch_conditional_mandatory_credentials.yml │ │ │ ├── fetch_credentials.yml │ │ │ ├── fetch_mandatory_credentials.yml │ │ │ ├── fetch_optional_credentials.yml │ │ │ ├── main.yml │ │ │ ├── prompt_credentials.yml │ │ │ ├── prompt_password.yml │ │ │ ├── prompt_username.yml │ │ │ ├── update_bs_credential_file.yml │ │ │ └── update_credentials.yml │ │ └── vars/ │ │ └── main.yml │ └── validation/ │ ├── tasks/ │ │ ├── main.yml │ │ ├── pre_requisite.yml │ │ └── validate_cred_file.yml │ └── vars/ │ └── main.yml ├── external_kafka_connect_details.yml ├── external_victoria_connect_details.yml ├── generate_functional_groups.yml ├── include_input_dir.yml ├── oim_cleanup.yml ├── roles/ │ ├── common/ │ │ ├── tasks/ │ │ │ ├── include_omnia_config.yml │ │ │ ├── include_omnia_config_credentials.yml │ │ │ └── main.yml │ │ └── vars/ │ │ └── main.yml │ ├── create_container_group/ │ │ ├── tasks/ │ │ │ └── main.yml │ │ └── vars/ │ │ └── main.yml │ ├── external_kafka_connect_details/ │ │ ├── tasks/ │ │ │ └── main.yml │ │ └── vars/ │ │ └── main.yml │ ├── external_victoria_connect_details/ │ │ ├── tasks/ │ │ │ └── main.yml │ │ └── vars/ │ │ └── main.yml │ ├── generate_functional_groups/ │ │ ├── tasks/ │ │ │ └── main.yml │ │ └── vars/ │ │ └── main.yml │ ├── idrac_pxe_boot/ │ │ ├── tasks/ │ │ │ └── main.yml │ │ └── vars/ │ │ └── main.yml │ ├── include_input_dir/ │ │ ├── tasks/ │ │ │ └── main.yml │ │ └── vars/ │ │ └── main.yml │ ├── oim_cleanup/ │ │ ├── oim_container_cleanup/ │ │ │ ├── tasks/ │ │ │ │ ├── cleanup_auth.yml │ │ │ │ ├── cleanup_build_stream.yml │ │ │ │ ├── cleanup_common.yml │ │ │ │ ├── cleanup_note.yml │ │ │ │ ├── cleanup_omnia_postgres.yml │ │ │ │ ├── cleanup_openchami.yml │ │ │ │ ├── cleanup_pulp.yml │ │ │ │ └── main.yml │ │ │ └── vars/ │ │ │ └── main.yml │ │ ├── omnia_credential_cleanup/ │ │ │ ├── tasks/ │ │ │ │ ├── cleanup_credentials.yml │ │ │ │ └── main.yml │ │ │ └── vars/ │ │ │ └── main.yml │ │ └── pre_requisite/ │ │ ├── tasks/ │ │ │ ├── main.yml │ │ │ └── pre_requisite.yml │ │ └── vars/ │ │ └── main.yml │ ├── slurm_cleanup/ │ │ ├── defaults/ │ │ │ └── main.yml │ │ └── tasks/ │ │ └── main.yml │ ├── slurm_config_backup/ │ │ ├── defaults/ │ │ │ └── main.yml │ │ └── tasks/ │ │ └── main.yml │ └── slurm_config_rollback/ │ ├── defaults/ │ │ └── main.yml │ └── tasks/ │ └── main.yml ├── set_pxe_boot.yml ├── slurm_config_util.yml └── 
upgrade_checkup.yml ================================================ FILE CONTENTS ================================================ ================================================ FILE: .all-contributorsrc ================================================ { "files": [ "README.md" ], "imageSize": 100, "commit": false, "badgeTemplate": "", "contributors": [ { "login": "j0hnL", "name": "John Lockman", "avatar_url": "https://avatars.githubusercontent.com/u/912987?v=4", "profile": "http://johnlockman.com", "contributions": [ "test", "code", "blog", "ideas", "maintenance", "mentoring", "design", "review", "talk", "bug" ] }, { "login": "lwilson", "name": "Lucas A. Wilson", "avatar_url": "https://avatars.githubusercontent.com/u/1236922?v=4", "profile": "https://github.com/lwilson", "contributions": [ "code", "design", "maintenance", "ideas", "blog", "doc", "mentoring", "projectManagement", "review", "talk", "bug" ] }, { "login": "sujit-jadhav", "name": "Sujit Jadhav", "avatar_url": "https://avatars.githubusercontent.com/u/73123831?v=4", "profile": "https://github.com/sujit-jadhav", "contributions": [ "ideas", "doc", "code", "review", "maintenance", "projectManagement", "mentoring", "talk", "question", "test", "bug" ] }, { "login": "DeepikaKrishnaiah", "name": "Deepika K", "avatar_url": "https://avatars.githubusercontent.com/u/73213880?v=4", "profile": "https://github.com/DeepikaKrishnaiah", "contributions": [ "code", "test", "bug", "security", "talk", "review", "mentoring" ] }, { "login": "abhishek-sa1", "name": "Abhishek SA", "avatar_url": "https://avatars.githubusercontent.com/u/94038029?v=4", "profile": "https://github.com/abhishek-sa1", "contributions": [ "code", "bug", "doc", "test", "maintenance", "talk", "mentoring", "review" ] }, { "login": "sakshiarora13", "name": "Sakshi Arora", "avatar_url": "https://avatars.githubusercontent.com/u/73195862?v=4", "profile": "https://github.com/sakshiarora13", "contributions": [ "code", "bug", "talk" ] }, { "login": "Shubhangi-dell", "name": "Shubhangi Srivastava", "avatar_url": "https://avatars.githubusercontent.com/u/72869337?v=4", "profile": "https://github.com/Shubhangi-dell", "contributions": [ "code", "maintenance", "bug", "talk" ] }, { "login": "cgoveas", "name": "Cassey Goveas", "avatar_url": "https://avatars.githubusercontent.com/u/88071888?v=4", "profile": "https://github.com/cgoveas", "contributions": [ "doc", "bug", "maintenance", "talk" ] }, { "login": "Khushboodholi", "name": "Khushboo Dholi", "avatar_url": "https://avatars.githubusercontent.com/u/12014935?v=4", "profile": "https://github.com/Khushboodholi", "contributions": [ "code" ] }, { "login": "prasoon-sinha", "name": "Prasoon Kumar Sinha", "avatar_url": "https://avatars.githubusercontent.com/u/5362594?v=4", "profile": "https://github.com/prasoon-sinha", "contributions": [ "ideas", "talk", "mentoring" ] }, { "login": "SajithDas", "name": "SajithDas", "avatar_url": "https://avatars.githubusercontent.com/u/78676226?v=4", "profile": "https://github.com/SajithDas", "contributions": [ "projectManagement", "talk" ] }, { "login": "i3igpete", "name": "i3igpete", "avatar_url": "https://avatars.githubusercontent.com/u/33877827?v=4", "profile": "https://github.com/i3igpete", "contributions": [ "business", "talk" ] }, { "login": "renzo-granados", "name": "renzo-granados", "avatar_url": "https://avatars.githubusercontent.com/u/83035817?v=4", "profile": "https://github.com/renzo-granados", "contributions": [ "bug" ] }, { "login": "Aditya-DP", "name": "Aditya-DP", "avatar_url": 
"https://avatars.githubusercontent.com/u/115771515?v=4", "profile": "https://github.com/Aditya-DP", "contributions": [ "code", "bug", "test" ] }, { "login": "Katakam-Rakesh", "name": "Katakam Rakesh Naga Sai", "avatar_url": "https://avatars.githubusercontent.com/u/125246792?v=4", "profile": "https://github.com/Katakam-Rakesh", "contributions": [ "code", "bug", "test" ] }, { "login": "araji", "name": "araji", "avatar_url": "https://avatars.githubusercontent.com/u/216020?v=4", "profile": "https://github.com/araji", "contributions": [ "code" ] }, { "login": "mikerenfro", "name": "Mike Renfro", "avatar_url": "https://avatars.githubusercontent.com/u/1451881?v=4", "profile": "https://mike.renf.ro/blog/", "contributions": [ "doc" ] }, { "login": "leereyno-asu", "name": "Lee Reynolds", "avatar_url": "https://avatars.githubusercontent.com/u/81774548?v=4", "profile": "https://github.com/leereyno-asu", "contributions": [ "code", "doc", "tutorial" ] }, { "login": "blesson-james", "name": "blesson-james", "avatar_url": "https://avatars.githubusercontent.com/u/72782936?v=4", "profile": "https://github.com/blesson-james", "contributions": [ "code", "test", "bug" ] }, { "login": "avinashvishwanath", "name": "avinashvishwanath", "avatar_url": "https://avatars.githubusercontent.com/u/77823538?v=4", "profile": "https://github.com/avinashvishwanath", "contributions": [ "doc" ] }, { "login": "abhishek-s-a", "name": "abhishek-s-a", "avatar_url": "https://avatars.githubusercontent.com/u/73212230?v=4", "profile": "https://github.com/abhishek-s-a", "contributions": [ "code", "doc", "test" ] }, { "login": "Franklin-Johnson", "name": "Franklin-Johnson", "avatar_url": "https://avatars.githubusercontent.com/u/84760103?v=4", "profile": "https://github.com/Franklin-Johnson", "contributions": [ "code", "blog" ] }, { "login": "teiland7", "name": "teiland7", "avatar_url": "https://avatars.githubusercontent.com/u/85184708?v=4", "profile": "https://github.com/teiland7", "contributions": [ "code", "blog" ] }, { "login": "VishnupriyaKrish", "name": "VishnupriyaKrish", "avatar_url": "https://avatars.githubusercontent.com/u/72784834?v=4", "profile": "https://github.com/VishnupriyaKrish", "contributions": [ "code", "test" ] }, { "login": "ishitadatta", "name": "Ishita Datta", "avatar_url": "https://avatars.githubusercontent.com/u/48859631?v=4", "profile": "https://rb.gy/ndlbhv", "contributions": [ "doc" ] }, { "login": "asu-wdizon", "name": "William Dizon", "avatar_url": "https://avatars.githubusercontent.com/u/81772355?v=4", "profile": "https://github.com/asu-wdizon", "contributions": [ "tutorial" ] }, { "login": "bssitton-BU", "name": "bssitton-BU", "avatar_url": "https://avatars.githubusercontent.com/u/14130464?v=4", "profile": "https://github.com/bssitton-BU", "contributions": [ "bug" ] }, { "login": "hearnsj", "name": "John Hearns", "avatar_url": "https://avatars.githubusercontent.com/u/19259589?v=4", "profile": "https://github.com/hearnsj", "contributions": [ "bug" ] }, { "login": "kbuggenhout", "name": "kris buggenhout", "avatar_url": "https://avatars.githubusercontent.com/u/30471699?v=4", "profile": "https://github.com/kbuggenhout", "contributions": [ "bug" ] }, { "login": "jiad-vmware", "name": "jiad-vmware", "avatar_url": "https://avatars.githubusercontent.com/u/68653329?v=4", "profile": "https://github.com/jiad-vmware", "contributions": [ "bug" ] }, { "login": "jlec", "name": "Justin Lecher", "avatar_url": "https://avatars.githubusercontent.com/u/79732?v=4", "profile": "https://jlec.de", "contributions": [ "ideas" ] }, 
{ "login": "Kavyabr23", "name": "Kavyabr23", "avatar_url": "https://avatars.githubusercontent.com/u/90390587?v=4", "profile": "https://github.com/Kavyabr23", "contributions": [ "code", "test" ] }, { "login": "vedaprakashanp", "name": "vedaprakashanp", "avatar_url": "https://avatars.githubusercontent.com/u/90596073?v=4", "profile": "https://github.com/vedaprakashanp", "contributions": [ "test", "code" ] }, { "login": "Bhagyashree-shetty", "name": "Bhagyashree-shetty", "avatar_url": "https://avatars.githubusercontent.com/u/90620926?v=4", "profile": "https://github.com/Bhagyashree-shetty", "contributions": [ "test", "code" ] }, { "login": "nihalranjan-hpc", "name": "Nihal Ranjan", "avatar_url": "https://avatars.githubusercontent.com/u/84398828?v=4", "profile": "https://github.com/nihalranjan-hpc", "contributions": [ "test", "code", "talk", "bug" ] }, { "login": "ptrinesh", "name": "ptrinesh", "avatar_url": "https://avatars.githubusercontent.com/u/73214211?v=4", "profile": "https://github.com/ptrinesh", "contributions": [ "code" ] }, { "login": "eltociear", "name": "Ikko Ashimine", "avatar_url": "https://avatars.githubusercontent.com/u/22633385?v=4", "profile": "https://bandism.net/", "contributions": [ "code" ] }, { "login": "Lakshmi-Patneedi", "name": "Lakshmi-Patneedi", "avatar_url": "https://avatars.githubusercontent.com/u/94051091?v=4", "profile": "https://github.com/Lakshmi-Patneedi", "contributions": [ "code" ] }, { "login": "Artlands", "name": "Jie Li", "avatar_url": "https://avatars.githubusercontent.com/u/31781106?v=4", "profile": "https://github.com/Artlands", "contributions": [ "code" ] }, { "login": "githubyongchen", "name": "Yong Chen", "avatar_url": "https://avatars.githubusercontent.com/u/5414112?v=4", "profile": "https://github.com/githubyongchen", "contributions": [ "design" ] }, { "login": "Zipexpo", "name": "nvtngan", "avatar_url": "https://avatars.githubusercontent.com/u/18387748?v=4", "profile": "http://www.myweb.ttu.edu/ngu00336/", "contributions": [ "code", "plugin" ] }, { "login": "tamilarasansubrama1", "name": "tamilarasansubrama1", "avatar_url": "https://avatars.githubusercontent.com/u/100588942?v=4", "profile": "https://github.com/tamilarasansubrama1", "contributions": [ "test", "code" ] }, { "login": "shemasr", "name": "shemasr", "avatar_url": "https://avatars.githubusercontent.com/u/100141664?v=4", "profile": "https://github.com/shemasr", "contributions": [ "bug", "code", "test" ] }, { "login": "naresh3774", "name": "Naresh Sharma", "avatar_url": "https://avatars.githubusercontent.com/u/101410892?v=4", "profile": "https://github.com/naresh3774", "contributions": [ "bug" ] }, { "login": "JonHass", "name": "Jon Hass", "avatar_url": "https://avatars.githubusercontent.com/u/6976486?v=4", "profile": "https://github.com/JonHass", "contributions": [ "doc", "design" ] }, { "login": "KalyanKonatham", "name": "KalyanKonatham", "avatar_url": "https://avatars.githubusercontent.com/u/101596828?v=4", "profile": "https://github.com/KalyanKonatham", "contributions": [ "bug" ] }, { "login": "rahulakolkar", "name": "Rahul Akolkar", "avatar_url": "https://avatars.githubusercontent.com/u/22768133?v=4", "profile": "https://github.com/rahulakolkar", "contributions": [ "bug" ] }, { "login": "srinandini-karumuri", "name": "srinandini-karumuri", "avatar_url": "https://avatars.githubusercontent.com/u/104345504?v=4", "profile": "https://github.com/srinandini-karumuri", "contributions": [ "code" ] }, { "login": "Rishabhm47", "name": "Rishabhm47", "avatar_url": 
"https://avatars.githubusercontent.com/u/106973551?v=4", "profile": "https://github.com/Rishabhm47", "contributions": [ "test", "code" ] }, { "login": "vaishakh-pm", "name": "vaishakh-pm", "avatar_url": "https://avatars.githubusercontent.com/u/104622022?v=4", "profile": "https://github.com/vaishakh-pm", "contributions": [ "test", "code" ] }, { "login": "shridhar-sharma", "name": "shridhar-sharma", "avatar_url": "https://avatars.githubusercontent.com/u/104621992?v=4", "profile": "https://github.com/shridhar-sharma", "contributions": [ "test", "code", "bug" ] }, { "login": "JayaDayyala", "name": "Jaya.Dayyala", "avatar_url": "https://avatars.githubusercontent.com/u/108455487?v=4", "profile": "https://github.com/JayaDayyala", "contributions": [ "test", "code" ] }, { "login": "fasongan", "name": "fasongan", "avatar_url": "https://avatars.githubusercontent.com/u/16153657?v=4", "profile": "https://github.com/fasongan", "contributions": [ "code" ] }, { "login": "rahuldell21", "name": "rahuldell21", "avatar_url": "https://avatars.githubusercontent.com/u/117621375?v=4", "profile": "https://github.com/rahuldell21", "contributions": [ "code", "test" ] }, { "login": "diptiman12", "name": "diptiman12", "avatar_url": "https://avatars.githubusercontent.com/u/117987073?v=4", "profile": "https://github.com/diptiman12", "contributions": [ "code" ] }, { "login": "SupriyaParthasarathy", "name": "Supriya Parthasarathy", "avatar_url": "https://avatars.githubusercontent.com/u/139955493?v=4", "profile": "https://github.com/SupriyaParthasarathy", "contributions": [ "projectManagement" ] }, { "login": "Subhankar-Adak", "name": "Subhankar-Adak", "avatar_url": "https://avatars.githubusercontent.com/u/140381176?v=4", "profile": "https://github.com/Subhankar-Adak", "contributions": [ "code" ] }, { "login": "priti-parate", "name": "priti-parate", "avatar_url": "https://avatars.githubusercontent.com/u/140157516?v=4", "profile": "https://github.com/priti-parate", "contributions": [ "code", "bug", "talk", "mentoring", "review" ] }, { "login": "lavanya5899", "name": "Lavanya Adhikari", "avatar_url": "https://avatars.githubusercontent.com/u/140372459?v=4", "profile": "https://github.com/lavanya5899", "contributions": [ "code" ] }, { "login": "preeti-thankachan", "name": "preeti-thankachan", "avatar_url": "https://avatars.githubusercontent.com/u/141405483?v=4", "profile": "https://github.com/preeti-thankachan", "contributions": [ "test", "bug" ] }, { "login": "glimchb", "name": "Boris Glimcher", "avatar_url": "https://avatars.githubusercontent.com/u/36732377?v=4", "profile": "https://github.com/glimchb", "contributions": [ "code", "maintenance", "doc" ] }, { "login": "MoshiBin", "name": "Moshi Binyamini", "avatar_url": "https://avatars.githubusercontent.com/u/1297388?v=4", "profile": "https://github.com/MoshiBin", "contributions": [ "code", "maintenance" ] }, { "login": "paul-tp", "name": "paul-tp", "avatar_url": "https://avatars.githubusercontent.com/u/169248855?v=4", "profile": "https://github.com/paul-tp", "contributions": [ "code" ] }, { "login": "Milisha-Gupta", "name": "Milisha Gupta", "avatar_url": "https://avatars.githubusercontent.com/u/52577117?v=4", "profile": "https://github.com/Milisha-Gupta", "contributions": [ "code", "test" ] }, { "login": "sakshi-singla-1735", "name": "sakshi-singla-1735", "avatar_url": "https://avatars.githubusercontent.com/u/169248923?v=4", "profile": "https://github.com/sakshi-singla-1735", "contributions": [ "code" ] }, { "login": "Sankeerna-S", "name": "Sankeerna-S", "avatar_url": 
"https://avatars.githubusercontent.com/u/169250907?v=4", "profile": "https://github.com/Sankeerna-S", "contributions": [ "code" ] }, { "login": "AjayKadoula", "name": "Ajay Kadoula", "avatar_url": "https://avatars.githubusercontent.com/u/38178003?v=4", "profile": "https://github.com/AjayKadoula", "contributions": [ "code" ] }, { "login": "ShubhamKumar1996", "name": "ShubhamKumar1996", "avatar_url": "https://avatars.githubusercontent.com/u/51914136?v=4", "profile": "https://github.com/ShubhamKumar1996", "contributions": [ "code" ] }, { "login": "SanthoshT2001", "name": "SanthoshT2001", "avatar_url": "https://avatars.githubusercontent.com/u/93521129?v=4", "profile": "https://github.com/SanthoshT2001", "contributions": [ "code" ] }, { "login": "Kratika-P", "name": "Kratika-P", "avatar_url": "https://avatars.githubusercontent.com/u/169249531?v=4", "profile": "https://github.com/Kratika-P", "contributions": [ "code", "test" ] }, { "login": "sbasu96", "name": "Soumyadeep Basu", "avatar_url": "https://avatars.githubusercontent.com/u/162503707?v=4", "profile": "https://github.com/sbasu96", "contributions": [ "doc" ] }, { "login": "VrindaMarwah", "name": "VrindaMarwah", "avatar_url": "https://avatars.githubusercontent.com/u/169263232?v=4", "profile": "https://github.com/VrindaMarwah", "contributions": [ "code", "test" ] }, { "login": "Kevin-Kodama", "name": "Kevin-Kodama", "avatar_url": "https://avatars.githubusercontent.com/u/163032741?v=4", "profile": "https://github.com/Kevin-Kodama", "contributions": [ "code" ] }, { "login": "balajikumaran-c-s", "name": "balajikumaran-c-s", "avatar_url": "https://avatars.githubusercontent.com/u/169248535?v=4", "profile": "https://github.com/balajikumaran-c-s", "contributions": [ "code", "test", "bug", "code" ] }, { "login": "Amogha-Reddy", "name": "Amogha-Reddy", "avatar_url": "https://avatars.githubusercontent.com/u/140503786?v=4", "profile": "https://github.com/Amogha-Reddy", "contributions": [ "test", "bug", "code" ] }, { "login": "krsandeepit", "name": "krsandeepit", "avatar_url": "https://avatars.githubusercontent.com/u/162142649?v=4", "profile": "https://github.com/krsandeepit", "contributions": [ "test", "bug" ] }, { "login": "Yash-shetty1", "name": "Yash-shetty1", "avatar_url": "https://avatars.githubusercontent.com/u/169258785?v=4", "profile": "https://github.com/Yash-shetty1", "contributions": [ "test", "bug" ] }, { "login": "nethramg", "name": "Nethravathi M G", "avatar_url": "https://avatars.githubusercontent.com/u/146437298?v=4", "profile": "https://github.com/nethramg", "contributions": [ "code", "projectManagement", "talk" ] }, { "login": "AbdulRijwan", "name": "Abdul Rijwan", "avatar_url": "https://avatars.githubusercontent.com/u/170396052?v=4", "profile": "https://github.com/AbdulRijwan", "contributions": [ "infra" ] }, { "login": "dweineha", "name": "David Weinehall", "avatar_url": "https://avatars.githubusercontent.com/u/42206500?v=4", "profile": "https://github.com/dweineha", "contributions": [ "code" ] }, { "login": "VenkateswaraVatam", "name": "Venkateswara Vatam", "avatar_url": "https://avatars.githubusercontent.com/u/153504816?v=4", "profile": "https://github.com/VenkateswaraVatam", "contributions": [ "projectManagement", "talk" ] }, { "login": "snarthan", "name": "Narthan S", "avatar_url": "https://avatars.githubusercontent.com/u/171680285?v=4", "profile": "https://github.com/snarthan", "contributions": [ "code", "mentoring", "review" ] }, { "login": "suman-square", "name": "Suman S", "avatar_url": 
"https://avatars.githubusercontent.com/u/178771071?v=4", "profile": "https://github.com/suman-square", "contributions": [ "code" ] }, { "login": "gurump21", "name": "Prabhu Gurumurthy", "avatar_url": "https://avatars.githubusercontent.com/u/189354746?v=4", "profile": "https://github.com/gurump21", "contributions": [ "bug" ] }, { "login": "Nagachandan-P", "name": "Nagachandan P", "avatar_url": "https://avatars.githubusercontent.com/Nagachandan-P", "profile": "https://github.com/Nagachandan-P", "contributions": [ "code" ] }, { "login": "pranavkumar74980", "name": "Pranav kumar", "avatar_url": "https://avatars.githubusercontent.com/pranavkumar74980", "profile": "https://github.com/pranavkumar74980", "contributions": [ "code", "test" ] }, { "login": "aditi-sharma27", "name": "Aditi Sharma", "avatar_url": "https://avatars.githubusercontent.com/aditi-sharma27", "profile": "https://github.com/aditi-sharma27", "contributions": [ "code" ] }, { "login": "Rohith-Ravut", "name": "Rohith-Ravut", "avatar_url": "https://avatars.githubusercontent.com/u/196186062?v=4", "profile": "https://github.com/Rohith-Ravut", "contributions": [ "test", "bug", "code" ] }, { "login": "RvishankarOMnia", "name": "RvishankarOMnia", "avatar_url": "https://avatars.githubusercontent.com/u/186007052?v=4", "profile": "https://github.com/RvishankarOMnia", "contributions": [ "ideas", "talk", "mentoring" ] }, { "login": "jagadeeshnv", "name": "Jagadeesh N V", "avatar_url": "https://avatars.githubusercontent.com/u/39791839?v=4", "profile": "https://github.com/jagadeeshnv", "contributions": [ "code" ] }, { "login": "sourabh-sahu1", "name": "sourabh-sahu1", "avatar_url": "https://avatars.githubusercontent.com/u/196315600?v=4", "profile": "https://github.com/sourabh-sahu1", "contributions": [ "code" ] }, { "login": "ghandoura", "name": "Adam Ghandoura", "avatar_url": "https://avatars.githubusercontent.com/u/87424850?v=4", "profile": "https://github.com/ghandoura", "contributions": [ "test", "code" ] }, { "login": "Coleman-Trader", "name": "Coleman-Trader", "avatar_url": "https://avatars.githubusercontent.com/u/196217244?v=4", "profile": "https://github.com/Coleman-Trader", "contributions": [ "code" ] }, { "login": "youngjae-hur7", "name": "youngjae-hur7", "avatar_url": "https://avatars.githubusercontent.com/u/196205015?v=4", "profile": "https://github.com/youngjae-hur7", "contributions": [ "code" ] }, { "login": "Grace-Chang2", "name": "Grace-Chang2", "avatar_url": "https://avatars.githubusercontent.com/u/196347461?v=4", "profile": "https://github.com/Grace-Chang2", "contributions": [ "code" ] }, { "login": "Cypher-Miller", "name": "Cypher-Miller", "avatar_url": "https://avatars.githubusercontent.com/u/123703182?v=4", "profile": "https://github.com/Cypher-Miller", "contributions": [ "code" ] }, { "login": "vvittal100", "name": "vvittal100", "avatar_url": "https://avatars.githubusercontent.com/u/202238575?v=4", "profile": "https://github.com/vvittal100", "contributions": [ "projectManagement", "talk" ] }, { "login": "kksenthilkumar", "name": "kksenthilkumar", "avatar_url": "https://avatars.githubusercontent.com/u/202253529?v=4", "profile": "https://github.com/kksenthilkumar", "contributions": [ "test" ] }, { "login": "pullan1", "name": "pullan1", "avatar_url": "https://avatars.githubusercontent.com/u/173048662?v=4", "profile": "https://github.com/pullan1", "contributions": [ "code" ] }, { "login": "harshal2799", "name": "harshal2799", "avatar_url": "https://avatars.githubusercontent.com/u/202241497?v=4", "profile": 
"https://github.com/harshal2799", "contributions": [ "test" ] }, { "login": "Sindhu-Ranganath", "name": "Sindhu-Ranganath", "avatar_url": "https://avatars.githubusercontent.com/u/208789597?v=4", "profile": "https://github.com/Sindhu-Ranganath", "contributions": [ "test" ] }, { "login": "Manasa-Hemmanur", "name": "Manasa H", "avatar_url": "https://avatars.githubusercontent.com/u/205002578?v=4", "profile": "https://github.com/Manasa-Hemmanur", "contributions": [ "code", "test" ] }, { "login": "Diya-Sumod", "name": "Diya-Sumod", "avatar_url": "https://avatars.githubusercontent.com/u/225136254?v=4", "profile": "https://github.com/Diya-Sumod", "contributions": [ "code", "test" ] }, { "login": "Tanmay-Raj1004", "name": "Tanmay-Raj1004", "avatar_url": "https://avatars.githubusercontent.com/u/227950687?v=4", "profile": "https://github.com/Tanmay-Raj1004", "contributions": [ "code", "test" ] }, { "login": "Anurag-Bijalwan", "name": "Anurag-Bijalwan", "avatar_url": "https://avatars.githubusercontent.com/u/218922922?v=4", "profile": "https://github.com/Anurag-Bijalwan", "contributions": [ "code" ] }, { "login": "SOWJANYAJAGADISH123", "name": "SOWJANYAJAGADISH123", "avatar_url": "https://avatars.githubusercontent.com/u/257989626?v=4", "profile": "https://github.com/SOWJANYAJAGADISH123", "contributions": [ "code" ] }, { "login": "mithileshreddy04", "name": "mithileshreddy04", "avatar_url": "https://avatars.githubusercontent.com/u/258000200?v=4", "profile": "https://github.com/mithileshreddy04", "contributions": [ "code" ] }, { "login": "Rajeshkumar-s2", "name": "Rajeshkumar-s2", "avatar_url": "https://avatars.githubusercontent.com/u/242588082?v=4", "profile": "https://github.com/Rajeshkumar-s2", "contributions": [ "code", "test" ] }, { "login": "Venu-p1", "name": "Venu-p1", "avatar_url": "https://avatars.githubusercontent.com/u/236371043?v=4", "profile": "https://github.com/Venu-p1", "contributions": [ "code", "test" ] } ], "contributorsPerLine": 7, "projectName": "omnia", "projectOwner": "dell", "repoType": "github", "repoHost": "https://github.com", "skipCi": true, "commitConvention": "angular", "commitType": "docs" } ================================================ FILE: .ansible-lint ================================================ skip_list: - var-naming[no-role-prefix] - unresolved-module - fqcn[canonical] - internal-error - role-name[path] ================================================ FILE: .config/ansible-lint.yml ================================================ --- exclude_paths: - .git/ - .github/ - accelerator/tests/ - network/tests/ - provision/tests/ - scheduler/tests/ - security/tests/ - storage/tests/ - test/ - utils/obsolete/ - docs/ - platforms/ - examples/ - input/ - .ansible-lint.yml - .readthedocs.yaml - prepare_oim/roles/configure_proxy/tasks/configure_proxy_rocky.yml - upgrade/roles/upgrade_idrac_telemetry/tasks/filter_idrac.yml - utils/server_spec_update/roles/os_update/tasks/kcmdline_update_rocky.yml - utils/roles/oim_cleanup/vars/rocky.yml - scheduler/roles/k8s_start_services/files/k8s_dashboard_admin.yaml - scheduler/playbooks/k8s_add_node.yml - "*ubuntu*" - "*rocky*" skip_list: - var-naming - unresolved-module - fqcn[canonical] - internal-error - role-name[path] verbosity: 1 profile: production ================================================ FILE: .config/requirements.yml ================================================ --- collections: - name: kubernetes.core version: 5.0.0 - name: ansible.utils version: 5.1.1 - name: community.crypto version: 2.23.0 - name: 
community.docker version: 3.12.1 - name: community.general version: 10.3.0 - name: community.grafana version: 2.1.0 - name: community.mysql version: 3.10.3 - name: dellemc.os10 version: 1.1.1 - name: dellemc.openmanage version: 9.6.0 - name: ansible.posix version: 2.0.0 - name: containers.podman version: 1.16.2 - name: community.postgresql version: 3.10.2 ================================================ FILE: .gitattributes ================================================ *.yml linguist-detectable *.tar.gz filter=lfs diff=lfs merge=lfs -text ================================================ FILE: .github/ISSUE_TEMPLATE/bug_report.md ================================================ --- name: Bug report about: Create a report to help us improve title: '' Omnia Version: '' labels: bug assignees: '' --- **Describe the bug** A clear and concise description of what the bug is. **To Reproduce** Steps to reproduce the behavior: 1. Go to '...' 2. Click on '....' 3. Scroll down to '....' 4. See error **Expected behavior** A clear and concise description of what you expected to happen. **Screenshots** If applicable, add screenshots to help explain your problem. **Additional context** Add any other context about the problem here. ================================================ FILE: .github/ISSUE_TEMPLATE/feature_request.md ================================================ --- name: Feature request about: Suggest an idea for this project title: '' labels: 'enhancement' assignees: '' --- **Is your feature request related to a problem? Please describe.** A clear and concise description of what the problem is. Ex. I'm always frustrated when [...] **Describe the solution you'd like** A clear and concise description of what you want to happen. **Describe alternatives you've considered** A clear and concise description of any alternative solutions or features you've considered. **Additional context** Add any other context or screenshots about the feature request here. ================================================ FILE: .github/ISSUE_TEMPLATE/logo_community.md ================================================ --- name: Add organization logo to the Omnia community list about: Display your organization's logo on the Omnia website title: 'Add logo to Omnia community list' labels: 'logo' assignees: '' --- **Permanent link to your organization's logo:** _Please replace this text with a permanent URL to your organization's logo. Logos will be automatically resized to fit._ ================================================ FILE: .github/branch-switcher.yml ================================================ preferredBranch: devel switchComment: > Hey @{{author}}, the base branch of your pull request has been changed to {{preferredBranch}}. Have a nice day! :wave: ================================================ FILE: .github/pull_request_template.md ================================================ ### Issues Resolved by this Pull Request Please be sure to associate your pull request with one or more open issues. Use the word _Fixes_ as well as a hashtag (_#_) prior to the issue number in order to automatically resolve associated issues (e.g., _Fixes #100_). Fixes # ### Description of the Solution Please describe the solution provided and how it resolves the associated issues. ### Suggested Reviewers If you wish to suggest specific reviewers for this solution, please include them in this section. Be sure to include the _@_ before the GitHub username. 
================================================ FILE: .github/stale.yml ================================================ # Number of days of inactivity before an issue becomes stale daysUntilStale: 60 # Number of days of inactivity before a stale issue is closed daysUntilClose: 14 # Issues with these labels will never be considered stale exemptLabels: - pinned - security # Label to use when marking an issue as stale staleLabel: stale # Comment to post when marking an issue as stale. Set to `false` to disable markComment: > This issue has been automatically marked as stale because it has not had recent activity. It will be closed if no further activity occurs. Thank you for your contributions. # Comment to post when closing a stale issue. Set to `false` to disable closeComment: false ================================================ FILE: .github/workflows/ansible-lint.yml ================================================ name: Ansible Lint on: pull_request: branches: - main - staging - release_1.7.1 - pub/build_stream - pub/v2.1_rc1 - pub/q1_dev jobs: build: name: Ansible Lint runs-on: ubuntu-latest steps: - name: Checkout repository uses: actions/checkout@v4 - name: Set up Python uses: actions/setup-python@v4 with: python-version: '3.x' - name: Install Ansible and Ansible Lint run: | python -m pip install --upgrade pip pip install ansible-core - name: Install Ansible Collections from requirements.yml run: | ansible-galaxy collection install -r .config/requirements.yml --force - name: Run ansible-lint uses: ansible/ansible-lint@main with: args: --config=.config/ansible-lint.yml ================================================ FILE: .github/workflows/pylint.yml ================================================ name: Pylint on: pull_request: branches: - main - staging - release_1.7.1 - pub/build_stream - pub/v2.1_rc1 - pub/q1_dev jobs: build: runs-on: ubuntu-latest strategy: matrix: python-version: ["3.11"] env: PYLINT_THRESHOLD: 8 steps: - uses: actions/checkout@v4 - name: Set up Python ${{ matrix.python-version }} uses: actions/setup-python@v3 with: python-version: ${{ matrix.python-version }} - name: Install dependencies run: | python -m pip install --upgrade pip pip install ansible pylint kubernetes prettytable requests passlib fastapi uvicorn sqlalchemy pytest httpx argon2-cffi pyyaml dependency-injector - name: Get changed Python files (excluding deleted) id: changed-files run: | git fetch origin ${{ github.base_ref }} CHANGED=$(git diff --name-only --diff-filter=d origin/${{ github.base_ref }} HEAD -- '*.py' || true) FILES="" for f in $CHANGED; do if [ -f "$f" ]; then FILES="$FILES $f" fi done FILES=$(echo "$FILES" | xargs) # Trim extra spaces echo "Filtered files: $FILES" echo "files=$FILES" >> "$GITHUB_OUTPUT" - name: Run pylint on changed files if: steps.changed-files.outputs.files != '' run: | echo "Running pylint on: ${{ steps.changed-files.outputs.files }}" # Filter out files from the excluded directory FILES=$(echo "${{ steps.changed-files.outputs.files }}" | tr ' ' '\n' | grep -v '^discovery/roles/telemetry/files/nersc-ldms-aggr/' | xargs) if [ -n "$FILES" ]; then # Set PYTHONPATH to include build_stream directory for proper import resolution # This allows pylint to resolve both relative imports in build_stream and regular imports elsewhere PYTHONPATH=.:./build_stream pylint $FILES --fail-under=${PYLINT_THRESHOLD} else echo "No files to lint after filtering." 
fi ================================================ FILE: .gitignore ================================================ /.idea/ /docs/build/ **/__pycache__/ .venv ================================================ FILE: .metadata/omnia_version ================================================ omnia_version: 2.0.0.0 omnia_installation_path: "" ================================================ FILE: .readthedocs.yaml ================================================ # .readthedocs.yaml # Read the Docs configuration file # See https://docs.readthedocs.io/en/stable/config-file/v2.html for details # Required version: 2 # Set the version of Python and other tools you might need build: os: ubuntu-22.04 tools: python: "3.11" # You can also specify other tool versions: # nodejs: "19" # rust: "1.64" # golang: "1.19" # Build documentation in the docs/ directory with Sphinx sphinx: configuration: docs/source/conf.py # If using Sphinx, optionally build your docs in additional formats such as PDF formats: - epub - htmlzip # Optionally declare the Python requirements required to build your docs python: install: - requirements: docs/source/requirements.txt ================================================ FILE: CODE_OF_CONDUCT.md ================================================ # Contributor Covenant Code of Conduct ## Our Pledge In the interest of fostering an open and welcoming environment, we as contributors and maintainers pledge to making participation in our project and our community a harassment-free experience for everyone, regardless of age, body size, disability, ethnicity, sex characteristics, gender identity and expression, level of experience, education, socio-economic status, nationality, personal appearance, race, religion, or sexual identity and orientation. ## Our Standards Examples of behavior that contributes to creating a positive environment include: * Using welcoming and inclusive language * Being respectful of differing viewpoints and experiences * Gracefully accepting constructive criticism * Focusing on what is best for the community * Showing empathy towards other community members Examples of unacceptable behavior by participants include: * The use of sexualized language or imagery and unwelcome sexual attention or advances * Trolling, insulting/derogatory comments, and personal or political attacks * Public or private harassment * Publishing others' private information, such as a physical or electronic address, without explicit permission * Other conduct which could reasonably be considered inappropriate in a professional setting ## Our Responsibilities Project maintainers are responsible for clarifying the standards of acceptable behavior and are expected to take appropriate and fair corrective action in response to any instances of unacceptable behavior. Project maintainers have the right and responsibility to remove, edit, or reject comments, commits, code, wiki edits, issues, and other contributions that are not aligned to this Code of Conduct, or to ban temporarily or permanently any contributor for other behaviors that they deem inappropriate, threatening, offensive, or harmful. ## Scope This Code of Conduct applies both within project spaces and in public spaces when an individual is representing the project or its community. Examples of representing a project or community include using an official project e-mail address, posting via an official social media account, or acting as an appointed representative at an online or offline event. 
Representation of a project may be further defined and clarified by project maintainers. ## Enforcement Instances of abusive, harassing, or otherwise unacceptable behavior may be reported by contacting the project team at luke_wilson@dell.com. All complaints will be reviewed and investigated and will result in a response that is deemed necessary and appropriate to the circumstances. The project team is obligated to maintain confidentiality with regard to the reporter of an incident. Further details of specific enforcement policies may be posted separately. Project maintainers who do not follow or enforce the Code of Conduct in good faith may face temporary or permanent repercussions as determined by other members of the project's leadership. ## Attribution This Code of Conduct is adapted from the [Contributor Covenant][homepage], version 1.4, available at https://www.contributor-covenant.org/version/1/4/code-of-conduct.html [homepage]: https://www.contributor-covenant.org For answers to common questions about this code of conduct, see https://www.contributor-covenant.org/faq ================================================ FILE: CONTRIBUTING.md ================================================ # CONTRIBUTE ## Introduction We encourage everyone to help us improve Omnia by contributing to the project. Contributions can range from documentation updates and example use cases, to commenting and properly styling code segments, all the way up to full feature contributions. We ask that contributors follow our established guidelines for contributing to the project. These guidelines are based on the [pravega project](https://github.com/pravega/pravega/). This document will evolve as the project matures. Please be sure to regularly refer back in order to stay in line with the contribution guidelines. ## How to Contribute to Omnia Contributions to Omnia are made through [Pull Requests (PRs)](https://help.github.com/en/github/collaborating-with-issues-and-pull-requests/about-pull-requests). To make a pull request against Omnia, use the following steps: 1. **Create an issue:** [Create an issue](https://help.github.com/en/github/managing-your-work-on-github/creating-an-issue) and describe what you are trying to solve. It does not matter whether it is a new feature, a bug fix, or an improvement. All pull requests need to be associated with an issue. When creating an issue, be sure to use the appropriate issue template (bug fix or feature request) and complete all of the required fields. If your issue does not fit either the bug fix or the feature request template, then create a blank issue and be sure to include the following information: * **Problem description:** Describe what you believe needs to be addressed * **Problem location:** In which file and at what line does this issue occur? * **Suggested resolution:** How do you intend to resolve the problem? 2. **Create a personal fork:** All work on Omnia should be done in a [fork of the repository](https://help.github.com/en/github/getting-started-with-github/fork-a-repo). Only the maintainers are allowed to commit directly to the project repository. 3. **Issue branch:** [Create a new branch](https://help.github.com/en/desktop/contributing-to-projects/creating-a-branch-for-your-work) on your fork of the repository. All contributions should be branched from `devel`. Use `git checkout devel; git checkout -b <new-branch-name>` to create the new branch. * **Branch name:** The branch name should be based on the issue you are addressing.
Use the following pattern to create your new branch name: `issue-<number>`, e.g., `issue-1023`. 4. **Commit changes to the issue branch:** It is important to commit your changes to the issue branch. Commit messages should be descriptive of the changes being made. * **Signing your commits:** All commits to Omnia need to be signed with the [Developer Certificate of Origin (DCO)](https://developercertificate.org/) in order to certify that the contributor has permission to contribute the code. In order to sign commits, use either the `--signoff` or `-s` option to `git commit`: ``` git commit --signoff git commit -s ``` Ensure you have your user name and e-mail set. The `--signoff | -s` option will use the configured user name and e-mail, so it is important to configure it before the first time you commit. Check the following references: * [Setting up your GitHub user name](https://help.github.com/articles/setting-your-username-in-git/) * [Setting up your e-mail address](https://help.github.com/articles/setting-your-commit-email-address-in-git/) 5. **Push the changes to your personal repo:** To be able to create a pull request, push the changes to origin: `git push origin <new-branch-name>`. Here we assume that `origin` is your personal repo, e.g., `lwilson/omnia.git`. 6. **Create a pull request:** [Create a pull request](https://help.github.com/en/github/collaborating-with-issues-and-pull-requests/creating-a-pull-request) with a title following the format _Issue ###: Description_ (e.g., _Issue 1023: Reformat testutils_). It is important that you do a good job with the description to make the job of the code reviewer easier. A good description not only reduces review time, but also reduces the probability of a misunderstanding with the pull request. * **Important:** When preparing a pull request, it is important to stay up to date with the project repository. We recommend that you rebase against the upstream repo _frequently_. To do this, use the following commands: ``` git pull --rebase upstream devel #upstream is dellhpc/omnia git push --force origin #origin is your fork of the repository (e.g., <username>/omnia.git) ``` * **PR Description:** Be sure to fully describe the pull request. Ideally, your PR description will contain: 1. A description of the main point (_e.g., why was this PR made?_), 2. Linking text to the related issue (_e.g., This PR closes issue #_), 3. How the changes solve the problem, and 4. How to verify that the changes work correctly. ## Omnia Branches and Contribution Flow The diagram below describes the contribution flow. Omnia has two lifetime branches: `devel` and `release`. The `release` branch is reserved for releases and their associated tags. The `devel` branch is where all development work occurs. The `devel` branch is also the default branch for the project. ![Omnia Branch Flowchart](docs/source/images/omnia-branch-structure.png "Flowchart of Omnia branches") ## Developer Certificate of Origin Contributions to Omnia must be signed with the [Developer Certificate of Origin (DCO)](https://developercertificate.org/): ``` Developer Certificate of Origin Version 1.1 Copyright (C) 2004, 2006 The Linux Foundation and its contributors. 1 Letterman Drive Suite D4700 San Francisco, CA, 94129 Everyone is permitted to copy and distribute verbatim copies of this license document, but changing it is not allowed.
Developer's Certificate of Origin 1.1 By making a contribution to this project, I certify that: (a) The contribution was created in whole or in part by me and I have the right to submit it under the open source license indicated in the file; or (b) The contribution is based upon previous work that, to the best of my knowledge, is covered under an appropriate open source license and I have the right under that license to submit that work with modifications, whether created in whole or in part by me, under the same open source license (unless I am permitted to submit under a different license), as indicated in the file; or (c) The contribution was provided directly to me by some other person who certified (a), (b) or (c) and I have not modified it. (d) I understand and agree that this project and the contribution are public and that a record of the contribution (including all personal information I submit with it, including my sign-off) is maintained indefinitely and may be redistributed consistent with this project or the open source license(s) involved. ``` ================================================ FILE: LICENSE ================================================ Apache License Version 2.0, January 2004 http://www.apache.org/licenses/ TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION 1. Definitions. "License" shall mean the terms and conditions for use, reproduction, and distribution as defined by Sections 1 through 9 of this document. "Licensor" shall mean the copyright owner or entity authorized by the copyright owner that is granting the License. "Legal Entity" shall mean the union of the acting entity and all other entities that control, are controlled by, or are under common control with that entity. For the purposes of this definition, "control" means (i) the power, direct or indirect, to cause the direction or management of such entity, whether by contract or otherwise, or (ii) ownership of fifty percent (50%) or more of the outstanding shares, or (iii) beneficial ownership of such entity. "You" (or "Your") shall mean an individual or Legal Entity exercising permissions granted by this License. "Source" form shall mean the preferred form for making modifications, including but not limited to software source code, documentation source, and configuration files. "Object" form shall mean any form resulting from mechanical transformation or translation of a Source form, including but not limited to compiled object code, generated documentation, and conversions to other media types. "Work" shall mean the work of authorship, whether in Source or Object form, made available under the License, as indicated by a copyright notice that is included in or attached to the work (an example is provided in the Appendix below). "Derivative Works" shall mean any work, whether in Source or Object form, that is based on (or derived from) the Work and for which the editorial revisions, annotations, elaborations, or other modifications represent, as a whole, an original work of authorship. For the purposes of this License, Derivative Works shall not include works that remain separable from, or merely link (or bind by name) to the interfaces of, the Work and Derivative Works thereof. 
"Contribution" shall mean any work of authorship, including the original version of the Work and any modifications or additions to that Work or Derivative Works thereof, that is intentionally submitted to Licensor for inclusion in the Work by the copyright owner or by an individual or Legal Entity authorized to submit on behalf of the copyright owner. For the purposes of this definition, "submitted" means any form of electronic, verbal, or written communication sent to the Licensor or its representatives, including but not limited to communication on electronic mailing lists, source code control systems, and issue tracking systems that are managed by, or on behalf of, the Licensor for the purpose of discussing and improving the Work, but excluding communication that is conspicuously marked or otherwise designated in writing by the copyright owner as "Not a Contribution." "Contributor" shall mean Licensor and any individual or Legal Entity on behalf of whom a Contribution has been received by Licensor and subsequently incorporated within the Work. 2. Grant of Copyright License. Subject to the terms and conditions of this License, each Contributor hereby grants to You a perpetual, worldwide, non-exclusive, no-charge, royalty-free, irrevocable copyright license to reproduce, prepare Derivative Works of, publicly display, publicly perform, sublicense, and distribute the Work and such Derivative Works in Source or Object form. 3. Grant of Patent License. Subject to the terms and conditions of this License, each Contributor hereby grants to You a perpetual, worldwide, non-exclusive, no-charge, royalty-free, irrevocable (except as stated in this section) patent license to make, have made, use, offer to sell, sell, import, and otherwise transfer the Work, where such license applies only to those patent claims licensable by such Contributor that are necessarily infringed by their Contribution(s) alone or by combination of their Contribution(s) with the Work to which such Contribution(s) was submitted. If You institute patent litigation against any entity (including a cross-claim or counterclaim in a lawsuit) alleging that the Work or a Contribution incorporated within the Work constitutes direct or contributory patent infringement, then any patent licenses granted to You under this License for that Work shall terminate as of the date such litigation is filed. 4. Redistribution. 
You may reproduce and distribute copies of the Work or Derivative Works thereof in any medium, with or without modifications, and in Source or Object form, provided that You meet the following conditions: (a) You must give any other recipients of the Work or Derivative Works a copy of this License; and (b) You must cause any modified files to carry prominent notices stating that You changed the files; and (c) You must retain, in the Source form of any Derivative Works that You distribute, all copyright, patent, trademark, and attribution notices from the Source form of the Work, excluding those notices that do not pertain to any part of the Derivative Works; and (d) If the Work includes a "NOTICE" text file as part of its distribution, then any Derivative Works that You distribute must include a readable copy of the attribution notices contained within such NOTICE file, excluding those notices that do not pertain to any part of the Derivative Works, in at least one of the following places: within a NOTICE text file distributed as part of the Derivative Works; within the Source form or documentation, if provided along with the Derivative Works; or, within a display generated by the Derivative Works, if and wherever such third-party notices normally appear. The contents of the NOTICE file are for informational purposes only and do not modify the License. You may add Your own attribution notices within Derivative Works that You distribute, alongside or as an addendum to the NOTICE text from the Work, provided that such additional attribution notices cannot be construed as modifying the License. You may add Your own copyright statement to Your modifications and may provide additional or different license terms and conditions for use, reproduction, or distribution of Your modifications, or for any such Derivative Works as a whole, provided Your use, reproduction, and distribution of the Work otherwise complies with the conditions stated in this License. 5. Submission of Contributions. Unless You explicitly state otherwise, any Contribution intentionally submitted for inclusion in the Work by You to the Licensor shall be under the terms and conditions of this License, without any additional terms or conditions. Notwithstanding the above, nothing herein shall supersede or modify the terms of any separate license agreement you may have executed with Licensor regarding such Contributions. 6. Trademarks. This License does not grant permission to use the trade names, trademarks, service marks, or product names of the Licensor, except as required for reasonable and customary use in describing the origin of the Work and reproducing the content of the NOTICE file. 7. Disclaimer of Warranty. Unless required by applicable law or agreed to in writing, Licensor provides the Work (and each Contributor provides its Contributions) on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied, including, without limitation, any warranties or conditions of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A PARTICULAR PURPOSE. You are solely responsible for determining the appropriateness of using or redistributing the Work and assume any risks associated with Your exercise of permissions under this License. 8. Limitation of Liability. 
In no event and under no legal theory, whether in tort (including negligence), contract, or otherwise, unless required by applicable law (such as deliberate and grossly negligent acts) or agreed to in writing, shall any Contributor be liable to You for damages, including any direct, indirect, special, incidental, or consequential damages of any character arising as a result of this License or out of the use or inability to use the Work (including but not limited to damages for loss of goodwill, work stoppage, computer failure or malfunction, or any and all other commercial damages or losses), even if such Contributor has been advised of the possibility of such damages. 9. Accepting Warranty or Additional Liability. While redistributing the Work or Derivative Works thereof, You may choose to offer, and charge a fee for, acceptance of support, warranty, indemnity, or other liability obligations and/or rights consistent with this License. However, in accepting such obligations, You may act only on Your own behalf and on Your sole responsibility, not on behalf of any other Contributor, and only if You agree to indemnify, defend, and hold each Contributor harmless for any liability incurred by, or claims asserted against, such Contributor by reason of your accepting any such warranty or additional liability. END OF TERMS AND CONDITIONS APPENDIX: How to apply the Apache License to your work. To apply the Apache License to your work, attach the following boilerplate notice, with the fields enclosed by brackets "[]" replaced with your own identifying information. (Don't include the brackets!) The text should be enclosed in the appropriate comment syntax for the file format. We also recommend that a file or class name and description of purpose be included on the same "printed page" as the copyright notice for easier identification within third-party archives. Copyright 2020 Dell Inc. or its subsidiaries. All Rights Reserved. Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with the License. You may obtain a copy of the License at http://www.apache.org/licenses/LICENSE-2.0 Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language governing permissions and limitations under the License. 
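In this repository, the boilerplate notice above is applied to the Ansible playbooks and roles as a YAML comment header (the `build_image_*` files later in this tree carry it verbatim); a minimal sketch of that header, with the copyright year shown only as an illustrative value:

```yaml
# Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
```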
================================================ FILE: README.md ================================================ ![GitHub](https://img.shields.io/github/license/dell/omnia) ![GitHub release (latest by date including pre-releases)](https://img.shields.io/github/v/release/dell/omnia?include_prereleases) ![GitHub last commit (branch)](https://img.shields.io/github/last-commit/dell/omnia/main) ![GitHub commits since tagged version](https://img.shields.io/github/commits-since/dell/omnia/v1.5/main) ![All contributors](https://img.shields.io/github/all-contributors/dell/omnia) ![GitHub forks](https://img.shields.io/github/forks/dell/omnia) ![GitHub Repo stars](https://img.shields.io/github/stars/dell/omnia) ![GitHub all releases](https://img.shields.io/github/downloads/dell/omnia/total) ![GitHub issues](https://img.shields.io/github/issues-raw/dell/omnia) ![GitHub Discussions](https://img.shields.io/github/discussions/dell/omnia)[](https://app.slack.com/client/TH80K68HY/C018L5109PW) #### Ansible playbook-based deployment of Slurm and Kubernetes on servers running Linux. Omnia is an open-source deployment toolkit that helps customers efficiently manage compute servers, storage, and networking within complex environments. Omnia uses Ansible playbook-based deployment to automate OS provisioning, driver installation and configuration, and deployment of schedulers such as Slurm and Kubernetes, as well as optimization libraries, machine learning frameworks/platforms, and AI models. ## Omnia Documentation Omnia 1.x Documentation is hosted on [Read The Docs 1.x](https://omnia-doc.readthedocs.io/en/latest/index.html). Omnia 2.x Documentation is hosted on [Read The Docs 2.x](https://omnia.readthedocs.io/en/latest/index.html). Current Status: ![GitHub](https://readthedocs.org/projects/omnia/badge/?version=latest) ## Licensing Omnia is made available under the [Apache 2.0 license](https://opensource.org/licenses/Apache-2.0). ## Contributing To Omnia We encourage everyone to help us improve Omnia by contributing to the project. Contributions can range from documentation updates and example use cases, to commenting and properly styling code segments, all the way up to full feature contributions. We ask that contributors follow our established [guidelines](https://omnia.readthedocs.io/en/latest/Contributing/index.html) for contributing to the project. ## Omnia Community Members: Dell Technologies Intel Corporation Università di Pisa Arizona State University Vizias LIQID Inc. Texas Tech University ## Contributors Our thanks go to everyone who makes Omnia possible ([emoji key](https://allcontributors.org/docs/en/emoji-key)):
[All-contributors table: a grid of contributor avatars, names, and contribution emoji, generated from the `.all-contributorsrc` file shown above.]
================================================ FILE: SECURITY.md ================================================ # Security Policy ## Supported Versions Omnia provides security support for Omnia 1.7. All users utilizing older versions are highly recommended to upgrade to the latest version. Omnia 1.6.1 users are also highly recommended to upgrade to Omnia 1.7. The upgrade functionality allows users to upgrade from Omnia 1.6.1 to Omnia 1.7. The upgrade process ensures that all the security updates and fixes are applied to the system. | Version | Supported | | ------- | ------------------ | | 1.7 | :white_check_mark: | | 1.6.1 | :white_check_mark: | | 1.5.1 | :x: | | 1.4.3.1 | :x: | ## Reporting a Vulnerability To report a vulnerability, users can raise an issue with vulnerability details. Please include a CVE (Common Vulnerabilities and Exposures) identifier if one has been assigned to the issue. This will help us track the issue and ensure it is addressed appropriately. If the vulnerability is accepted, the team will review the issue and make appropriate changes to fix the vulnerability. The fix can be expected in a minor patch release or will be included in the next major release. In case the vulnerability is deemed to be high risk, the team may also provide a temporary fix or workaround until the next release is available. However, if the vulnerability is deemed to be low risk or is not covered in the product security coverage scope, the issue may be denied. ================================================ FILE: ansible.cfg ================================================ [defaults] log_path = /opt/omnia/log/core/playbooks/omnia.log # Set the remote temporary directory to a shared path to avoid SELinux issues remote_tmp = /opt/omnia/tmp/.ansible/tmp/ host_key_checking = false forks = 5 timeout = 180 executable = /bin/bash display_skipped_hosts = false library = discovery/library:common/library/modules #inventory = /opt/omnia/omnia_inventory/cluster_layout module_utils = common/library/module_utils [persistent_connection] command_timeout = 180 connect_timeout = 180 [ssh_connection] retries = 3 ssh_args = -o ControlMaster=auto -o ControlPersist=60 -o ConnectTimeout=60 ================================================ FILE: build_image_aarch64/ansible.cfg ================================================ [defaults] log_path = /opt/omnia/log/core/playbooks/build_image_aarch64.log remote_tmp = /opt/omnia/tmp/.ansible/tmp/ host_key_checking = false forks = 5 timeout = 180 executable = /bin/bash library = ../common/library/modules module_utils = ../common/library/module_utils [persistent_connection] command_timeout = 180 connect_timeout = 180 [ssh_connection] retries = 3 ssh_args = -o ControlMaster=auto -o ControlPersist=60 -o ConnectTimeout=60 ================================================ FILE: build_image_aarch64/build_image_aarch64.yml ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
--- - name: Check if upgrade is in progress ansible.builtin.import_playbook: ../utils/upgrade_checkup.yml - name: Set_fact for fetch omnia config credentials hosts: localhost connection: local tags: always tasks: - name: Set dynamic run tags including 'build_aarch_image' when: not config_file_status | default(false) | bool ansible.builtin.set_fact: omnia_run_tags: "{{ (ansible_run_tags | default([]) + ['build_aarch_image']) | unique }}" cacheable: true - name: Invoke validate_config.yml to perform L1 and L2 validations with build_image tag ansible.builtin.import_playbook: ../input_validation/validate_config.yml tags: always - name: Invoke get_config_credentials.yml ansible.builtin.import_playbook: ../utils/credential_utility/get_config_credentials.yml - name: Include input project directory when: not project_dir_status | default(false) | bool ansible.builtin.import_playbook: ../utils/include_input_dir.yml vars: openchami_vars_suppport: true omnia_metadata_support: true - name: Load build_stream configuration hosts: localhost connection: local gather_facts: false tags: always tasks: - name: Include build_stream config file ansible.builtin.include_vars: file: "{{ input_project_dir }}/build_stream_config.yml" failed_when: false - name: Set build_stream variables from extra_vars ansible.builtin.set_fact: build_stream_job_id: "{{ job_id | default('') }}" build_stream_image_key: "{{ image_key | default('') }}" build_stream_functional_groups: "{{ functional_groups | default([]) }}" enable_build_stream_flag: "{{ enable_build_stream | default(false) | bool }}" - name: Debug - Show build_stream variables ansible.builtin.debug: msg: - "build_stream_job_id: {{ build_stream_job_id }}" - "build_stream_image_key: {{ build_stream_image_key }}" - "build_stream_functional_groups: {{ build_stream_functional_groups }}" - "enable_build_stream_flag: {{ enable_build_stream_flag }}" verbosity: 2 - name: Fetch build_stream prerequisites ansible.builtin.include_role: name: fetch_packages tasks_from: build_stream_prerequisite.yml vars: job_id: "{{ build_stream_job_id }}" image_key: "{{ build_stream_image_key }}" functional_groups: "{{ build_stream_functional_groups }}" enable_build_stream: "{{ enable_build_stream_flag }}" when: enable_build_stream_flag - name: Gather OIM data hosts: localhost gather_facts: false tasks: - name: Include gather_oim_data role ansible.builtin.include_role: name: prepare_arm_node tasks_from: gather_oim_data.yml vars_from: main - name: Create oim group and provision group ansible.builtin.import_playbook: ../utils/create_container_group.yml vars: oim_group: true tags: always - name: Configure auth for OpenCHAMI hosts: oim connection: ssh tasks: - name: OpenCHAMI cluster authentication ansible.builtin.include_tasks: "{{ playbook_dir }}/../common/tasks/common/openchami_auth.yml" vars: oim_node_name: "{{ hostvars['localhost']['oim_node_name'] }}" - name: Generate functional groups configuration when enable_build_stream is false ansible.builtin.import_playbook: ../utils/generate_functional_groups.yml tags: always when: not enable_build_stream - name: Verify aarch64 functional_group presnt hosts: localhost connection: local tasks: - name: Fetch aarch64 functional_groups ansible.builtin.include_role: name: fetch_packages tasks_from: check_aarch64_fg.yml when: not enable_build_stream - name: Prepare aarch64 nodes hosts: admin_aarch64 gather_facts: false roles: - prepare_arm_node - name: Fetch packages for aarch64 hosts: localhost connection: local gather_facts: false roles: - fetch_packages - 
name: Openchmi build image for aarch_64 hosts: localhost connection: local gather_facts: false roles: - image_creation - name: Build aarch64 image completion hosts: localhost connection: local tasks: - name: Build Image completion ansible.builtin.include_role: name: fetch_packages tasks_from: aarch64_build_image_completion.yml ================================================ FILE: build_image_aarch64/roles/fetch_packages/tasks/aarch64_build_image_completion.yml ================================================ # Copyright 2025 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. --- - name: Build Image completion ansible.builtin.debug: msg: "{{ aarch64_build_image_completion_msg.splitlines() | join(' ') }}" ================================================ FILE: build_image_aarch64/roles/fetch_packages/tasks/build_stream_prerequisite.yml ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. --- - name: Debug - Show explicitly passed variables ansible.builtin.debug: msg: - "job_id: {{ job_id | default('NOT_SET') }}" - "image_key: {{ image_key | default('NOT_SET') }}" - "functional_groups: {{ functional_groups | default('NOT_SET') }}" - "enable_build_stream: {{ enable_build_stream | default('NOT_SET') }}" verbosity: 2 - name: Set build_stream variables from explicitly passed values ansible.builtin.set_fact: build_stream_job_id: "{{ job_id }}" image_key: "{{ image_key }}" cacheable: true - name: Normalize functional_groups input into list ansible.builtin.set_fact: functional_group_list: "{{ functional_groups if functional_groups is iterable and functional_groups is not string else (functional_groups | from_yaml) }}" when: functional_groups is defined and enable_build_stream - name: Fail when build stream enabled without job id or functional groups ansible.builtin.fail: msg: "{{ build_stream_prerequisite_fail_msg }}" when: - enable_build_stream | bool - (build_stream_job_id | default('') | string) | length == 0 or (functional_group_list | default([]) | length == 0) or (image_key | default('') | string) | length == 0 # noqa: yaml[line-length] ================================================ FILE: build_image_aarch64/roles/fetch_packages/tasks/check_aarch64_fg.yml ================================================ # Copyright 2025 Dell Inc. or its subsidiaries. All Rights Reserved. 
# # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. --- - name: Load functional_group_config.yml ansible.builtin.include_vars: file: "{{ functional_groups_config_path }}" name: functional_group_cfg - name: Check for aarch64 functional groups ansible.builtin.set_fact: fg_aarch64: >- {{ functional_group_cfg.functional_groups | selectattr('name', 'search', '_aarch64$') | list | length > 0 }} cacheable: true - name: Fail if aarch64 functional groups are not present ansible.builtin.fail: msg: "{{ functional_group_absent_msg.splitlines() | join(' ') }}" when: not fg_aarch64 ================================================ FILE: build_image_aarch64/roles/fetch_packages/tasks/fetch_packages.yml ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
--- - name: Fetch aarch64 default_packages.json and additional_packages.json software packages block: - name: Collect base image RPM packages (default + additional + admin_debug) base_image_package_collector: default_json_path: "{{ default_json_path }}" additional_json_path: "{{ additional_json_path | default('') }}" admin_debug_json_path: "{{ admin_debug_json_path | default('') }}" software_config_path: "{{ software_config_file_path }}" register: base_image_output - name: Set aarch64_base_image_packages ansible.builtin.set_fact: aarch64_base_image_packages: "{{ base_image_output.base_image_packages }}" - name: Debug package aarch64_base_image_packages ansible.builtin.debug: var: aarch64_base_image_packages verbosity: 2 - name: Parse functional_group_config.yml to list functional_group_parser: functional_groups_file: "{{ functional_groups_file_path }}" register: functional_group_parser_list when: not enable_build_stream - name: Set fact for functional_group_list ansible.builtin.set_fact: functional_group_list: "{{ functional_group_parser_list.functional_groups }}" when: not enable_build_stream - name: Debug full functional group parser output ansible.builtin.debug: var: functional_group_list verbosity: 2 - name: Read packages for compute image softwares image_package_collector: functional_groups: "{{ functional_group_list }}" software_config_file: "{{ software_config_file_path }}" input_project_dir: "{{ input_project_dir }}" additional_json_path: "{{ additional_json_path }}" register: compute_images_output - name: Save packages for aarch64 keys in compute_images_dict ansible.builtin.set_fact: compute_images_dict: >- {{ compute_images_output.compute_images_dict | dict2items | selectattr('key', 'search', '_aarch64$') | items2dict }} - name: Debug software directory compute_images_dict ansible.builtin.debug: var: compute_images_dict verbosity: 2 ================================================ FILE: build_image_aarch64/roles/fetch_packages/tasks/fetch_pulp_repos.yml ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
--- - name: Fetch pulp endpoints when aarch_64 build_stream enabled block: - name: Fetch pulp endpoints for aarch64 ansible.builtin.command: > pulp rpm distribution list --field name,base_url register: pulp_endpoints changed_when: false - name: Filter only aarch_64 distributions ansible.builtin.set_fact: pulp_aarch_64_distributions: >- {{ pulp_endpoints.stdout | from_json | selectattr('name', 'match', '^aarch64') | list }} - name: Build rhel_repos list from pulp_aarch_64_distributions ansible.builtin.set_fact: rhel_aarch64_repos: >- {{ pulp_aarch_64_distributions | map('combine', {'gpg': ''}) | list }} - name: Debug rhel_aarch64_repos ansible.builtin.debug: msg: "{{ rhel_aarch64_repos | to_nice_yaml(indent=2) }}" verbosity: 2 ================================================ FILE: build_image_aarch64/roles/fetch_packages/tasks/main.yml ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. --- - name: Check local_repo.yml execution block: - name: Check if local_repo.yml is executed successfully ansible.builtin.stat: path: "{{ metadata_file_path }}" register: metadata_file_status rescue: - name: Fail if metadata file is not present ansible.builtin.fail: msg: "{{ local_repo_check_msg }}" when: not metadata_file_status.stat.exists - name: Initialize fg_aarch64 as false ansible.builtin.set_fact: fg_aarch64: "{{ fg_aarch64 | default(false) }}" when: enable_build_stream | default(false) - name: Include functional groups config ansible.builtin.include_vars: file: "{{ functional_groups_file_path }}" name: functional_groups_config when: not enable_build_stream - name: Set functional_groups_file_path for build_stream disabled flow ansible.builtin.set_fact: functional_groups_file_path: "{{ functional_groups_file_path }}" when: not enable_build_stream - name: Include software config ansible.builtin.include_vars: file: "{{ software_config_file_path }}" name: software_config when: enable_build_stream | default(false) - name: Set cluster OS facts ansible.builtin.set_fact: rhel_tag: "{{ software_config.cluster_os_version }}" default_json_path: "{{ input_project_dir }}/config/aarch64/{{ software_config.cluster_os_type }}/{{ software_config.cluster_os_version }}/default_packages.json" # noqa: yaml[line-length] additional_json_path: "{{ input_project_dir }}/config/aarch64/{{ software_config.cluster_os_type }}/{{ software_config.cluster_os_version }}/additional_packages.json" # noqa: yaml[line-length] admin_debug_json_path: "{{ input_project_dir }}/config/aarch64/{{ software_config.cluster_os_type }}/{{ software_config.cluster_os_version }}/admin_debug_packages.json" # noqa: yaml[line-length] - name: Fetch pulp endpoint repos ansible.builtin.include_tasks: fetch_pulp_repos.yml when: fg_aarch64 or enable_build_stream - name: Fetch packages for base and compute image softwares ansible.builtin.include_tasks: fetch_packages.yml when: fg_aarch64 or enable_build_stream ================================================ FILE: 
build_image_aarch64/roles/fetch_packages/vars/main.yml ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. --- metadata_file_path: "/opt/omnia/offline_repo/.data/localrepo_metadata.yml" local_repo_check_msg: | Failure: metadata file is not present at path {{ metadata_file_path }}. Please make sure that local_repo.yml playbook is executed successfully. input_project_dir: "{{ hostvars['localhost']['input_project_dir'] }}" functional_groups_file_path: "{{ hostvars['localhost']['functional_groups_config_path'] | default('/opt/omnia/.data/functional_groups_config.yml') }}" software_config_file_path: "{{ input_project_dir }}/software_config.json" aarch64_build_image_completion_msg: | The playbook build_image_aarch64.yml has been completed successfully. To boot x86_64 and aarch64 nodes execute discovery/discovery.yml playbook. functional_group_absent_msg: | Failure: No aarch64 functional groups found in functional_group_config.yml input file. Please make sure aarch64 functional_group should be present in input file functional_group_config.yml to execute build_image_aarch64.yml successfully. build_stream_prerequisite_fail_msg: | Build Stream mode is enabled. Manual execution is not supported. Please trigger this workflow via the GitLab pipeline. ================================================ FILE: build_image_aarch64/roles/image_creation/tasks/build_base_image.yml ================================================ # Copyright 2025 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
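# Note (illustrative): the base-image build below is launched with async: 3600 and
# poll: 0, so the ansible-playbook wrapper returns immediately and the job is then
# polled with async_status. Using this role's defaults (job_retry: "120",
# job_delay: "30"), polling covers roughly 120 x 30 s = 3600 s, the same window as
# the async timeout, before the rescue path raises base_image_failure_msg.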
--- - name: Normalize build stream inputs for base image ansible.builtin.set_fact: enable_build_stream: "{{ enable_build_stream | default(false) | bool }}" build_stream_job_id: "{{ build_stream_job_id | default('') }}" image_key: "{{ image_key | default('') }}" base_image_suffix: "" - name: Set base image suffix when build stream inputs present ansible.builtin.set_fact: base_image_suffix: "_{{ build_stream_job_id }}-{{ image_key | default('') }}" rhel_base_image_name: "{{ rhel_aarch64_base_image_name }}_{{ build_stream_job_id }}-{{ image_key | default('') }}" when: - enable_build_stream | bool - (build_stream_job_id | default('') | length) > 0 - (image_key | default('') | length) > 0 - name: Create temporary inventory with ochami group ansible.builtin.copy: dest: "{{ aarch64_inventory_file }}" content: | [ochami] {{ groups['admin_aarch64'] | join('\n') }} mode: "{{ hostvars['localhost']['file_permissions_644'] }}" - name: Create aarch64_base_image.log as a file ansible.builtin.file: path: "{{ openchami_aarch64_base_image_log_path }}" state: touch mode: "{{ dir_permissions_644 }}" - name: Load the openchami image vars ansible.builtin.template: src: "{{ openchami_base_image_vars_template }}" dest: "{{ openchami_aarch64_base_image_vars_path }}" mode: "{{ dir_permissions_644 }}" - name: Invoking Openchami playbook for rhel-base image build ansible.builtin.shell: | set -o pipefail ansible-playbook {{ openchami_clone_path }}/dell/podman-quadlets/image.yaml \ -i {{ aarch64_inventory_file }} -v \ --extra-vars "@{{ openchami_aarch64_base_image_vars_path }}" \ --tags base_image -v | \ /usr/bin/tee {{ openchami_aarch64_base_image_log_path }} async: 3600 # Set async timeout (e.g., 1 hour) poll: 0 # Non-blocking (continue the playbook without waiting for completion) register: base_image_build changed_when: true - name: Wait for rhel-base image OpenCHAMI jobs to finish block: - name: Wait for rhel-base image OpenCHAMI jobs to finish ansible.builtin.async_status: jid: "{{ base_image_build.ansible_job_id }}" register: job_result until: job_result.finished retries: "{{ job_retry }}" delay: "{{ job_delay }}" rescue: - name: Fail the build if the base image build fails ansible.builtin.fail: msg: | {{ base_image_failure_msg }} always: - name: Remove generated base image vars file ansible.builtin.file: path: "{{ openchami_aarch64_base_image_vars_path }}" state: absent - name: Set openchami SELinux context ansible.builtin.command: chcon -R system_u:object_r:container_file_t:s0 "{{ oim_shared_path }}/omnia/openchami" changed_when: true delegate_to: oim connection: ssh failed_when: false ================================================ FILE: build_image_aarch64/roles/image_creation/tasks/build_compute_image.yml ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
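# Note (illustrative): the compute builds below run against the single host in the
# admin_aarch64 inventory group. A throwaway inventory is written for the OpenCHAMI
# playbook; with a hypothetical host named arm-builder-01 it would contain:
#   [ochami]
#   arm-builder-01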
--- - name: Normalize build stream inputs ansible.builtin.set_fact: enable_build_stream: "{{ enable_build_stream | default(false) | bool }}" build_stream_job_id: "{{ build_stream_job_id | default('') }}" image_key: "{{ image_key | default('') }}" compute_image_suffix: "" - name: Set compute image suffix when build stream inputs present ansible.builtin.set_fact: compute_image_suffix: "_{{ build_stream_job_id }}-{{ image_key | default('') }}" when: - enable_build_stream | bool - (build_stream_job_id | default('') | length) > 0 - (image_key | default('') | length) > 0 - name: Create temporary inventory with ochami group ansible.builtin.copy: dest: "{{ aarch64_inventory_file }}" content: | [ochami] {{ groups['admin_aarch64'] | join('\n') }} mode: "{{ hostvars['localhost']['file_permissions_644'] }}" - name: Create aarch64 compute image log files ansible.builtin.file: path: "{{ openchami_log_dir }}/{{ item.key }}{{ compute_image_suffix }}_compute_image.log" state: touch mode: "{{ dir_permissions_644 }}" loop: "{{ compute_images_dict | dict2items }}" loop_control: loop_var: item - name: Render compute images templates ansible.builtin.template: src: "{{ openchami_compute_image_vars_template }}" dest: "{{ openchami_dir }}/{{ item.key }}{{ compute_image_suffix }}_compute_images.yaml" mode: "{{ dir_permissions_644 }}" vars: functional_group: "{{ item.value.functional_group }}" packages: "{{ item.value.packages }}" base_compute_image_name: "{{ item.key }}{{ compute_image_suffix }}" rhel_base_compute_image_name: "rhel-{{ item.key }}{{ compute_image_suffix }}" loop: "{{ compute_images_dict | dict2items }}" loop_control: loop_var: item - name: Invoking OpenCHAMI playbooks asynchronously for aarch64 compute image_build ansible.builtin.shell: | set -o pipefail ansible-playbook {{ openchami_clone_path }}/dell/podman-quadlets/image.yaml \ -i {{ aarch64_inventory_file }} -v \ --extra-vars '@{{ openchami_dir }}/{{ item.key }}{{ compute_image_suffix }}_compute_images.yaml' \ --tags compute_image -v | \ /usr/bin/tee '{{ openchami_log_dir }}/{{ item.key }}{{ compute_image_suffix }}_compute_image.log' async: 3600 # Set async timeout (e.g., 1 hour) poll: 0 # Non-blocking (continue the playbook without waiting for completion) loop: "{{ compute_images_dict | dict2items }}" loop_control: loop_var: item register: compute_image_build_job changed_when: true - name: Wait for all OpenCHAMI jobs to finish and remove generated compute images templates block: - name: Display image build jobs status ansible.builtin.debug: msg: "Waiting for image build: {{ item.item.key }} (Job ID: {{ item.ansible_job_id }})" loop: "{{ compute_image_build_job.results }}" loop_control: label: "{{ item.item.key }}" - name: Wait for all OpenCHAMI jobs to finish ansible.builtin.async_status: jid: "{{ item.ansible_job_id }}" register: job_result until: job_result.finished no_log: true retries: "{{ job_retry }}" delay: "{{ job_delay }}" loop: "{{ compute_image_build_job.results }}" loop_control: label: "Building: {{ item.item.key }}" rescue: - name: Identify failed image builds ansible.builtin.set_fact: failed_images: > {{ job_result.results | selectattr('failed', 'defined') | selectattr('failed', 'equalto', true) | map(attribute='item.item.key') | list }} when: job_result.results is defined - name: Build failure message list ansible.builtin.set_fact: failure_msg_list: - "aarch64 compute image build job did not complete successfully." - "Check logs at {{ openchami_log_dir }} for respective functional group for more details." 
- "" - "Failed images:" - name: Add failed image names to message ansible.builtin.set_fact: failure_msg_list: "{{ failure_msg_list + [' - ' + item] }}" loop: "{{ failed_images | default(['Unknown - check all logs']) }}" - name: Add log paths section to message ansible.builtin.set_fact: failure_msg_list: "{{ failure_msg_list + ['', 'Check logs at ' + openchami_log_dir + ' for details:'] }}" - name: Add log file paths to message ansible.builtin.set_fact: failure_msg_list: "{{ failure_msg_list + [' - ' + openchami_log_dir + '/' + item + log_suffix + '_compute_image.log'] }}" vars: log_suffix: "{{ compute_image_suffix }}" loop: "{{ failed_images | default([]) }}" - name: Display aarch64 compute image build failure details ansible.builtin.debug: msg: "{{ failure_msg_list }}" - name: Failed to build the aarch64 compute image ansible.builtin.fail: msg: "aarch64 compute image build failed. See details above." always: - name: Remove generated compute images templates ansible.builtin.file: path: "{{ openchami_dir }}/{{ item.key }}{{ compute_image_suffix }}_compute_images.yaml" state: absent loop: "{{ compute_images_dict | dict2items }}" loop_control: loop_var: item - name: Remove temporary inventory file ansible.builtin.file: path: "{{ aarch64_inventory_file }}" state: absent - name: Set openchami SELinux context ansible.builtin.command: chcon -R system_u:object_r:container_file_t:s0 "{{ oim_shared_path }}/omnia/openchami" changed_when: true delegate_to: oim connection: ssh failed_when: false ================================================ FILE: build_image_aarch64/roles/image_creation/tasks/main.yml ================================================ # Copyright 2025 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
--- - name: Include metadata vars ansible.builtin.include_vars: "{{ omnia_metadata_file }}" register: include_metadata no_log: true - name: Include global variables from common folder ansible.builtin.include_vars: "{{ role_path }}/../../../common/vars/openchami_image_cmd.yml" register: ochami_image_global_vars - name: Invoking aarch64 build base image playbook ansible.builtin.include_tasks: build_base_image.yml tags: base_image - name: Invoking aarch64 build rhel compute image playbooks ansible.builtin.include_tasks: build_compute_image.yml tags: compute_image ================================================ FILE: build_image_aarch64/roles/image_creation/templates/base_image_template.j2 ================================================ openchami_work_dir: "{{ openchami_work_dir }}" rhel_tag: "{{ rhel_tag }}" rhel_base_image_name: "{{ rhel_aarch64_base_image_name }}" rhel_base_image: "{{ oim_node_name }}/{{ rhel_aarch64_base_image_name }}" cluster_name: "{{ oim_node_name }}" cluster_domain: "{{ domain_name }}" group_name: base rhel_base_mounts: {{ ochami_mounts | join(' ') }} image_build_name: {{ ochami_aarch64_image | join(' ') }} rhel_base_command_options: {{ ochami_base_command | join(' ') }} rhel_repos: {% for repo in rhel_aarch64_repos %} - { name: '{{ repo.name }}', url: '{{ repo.base_url }}', gpg: '{{ repo.gpg }}' } {% endfor %} base_image_packages: {% for pkg in aarch64_base_image_packages %} - {{ pkg }} {% endfor %} base_image_commands: {% for cmd in base_image_commands %} - {{ cmd | to_json }} {% endfor %} ================================================ FILE: build_image_aarch64/roles/image_creation/templates/compute_images_templates.j2 ================================================ openchami_work_dir: "{{ openchami_work_dir }}" rhel_tag: "{{ rhel_tag }}" rhel_base_image: "{{ oim_node_name }}/{{ rhel_aarch64_base_image_name }}" {% set image_name_suffix = compute_image_suffix | default('') %} base_compute_image_name: "{{ item.key }}{{ image_name_suffix }}" rhel_base_compute_image_name: "rhel-{{ item.key }}{{ image_name_suffix }}" rhel_base_compute_image: "{{ oim_node_name }}/rhel-{{ item.key }}{{ image_name_suffix }}" # S3 directory should stay stable (no job-id) while the filename will carry job-id via image name s3_dir_name: "rhel-{{ item.key }}" cluster_name: "{{ oim_node_name }}" cluster_domain: "{{ domain_name }}" group_name: "{{ item.key }}" rhel_base_compute_mounts: --user 0 --privileged -v {{ oim_shared_path }}/omnia/pulp/settings/certs/pulp_webserver.crt:/etc/pki/ca-trust/source/anchors/pulp_webserver.crt:z -v {{ openchami_work_dir }}/images/{{ rhel_base_compute_image_name }}-{{ rhel_tag }}.yaml:/home/builder/config.yaml:z image_build_name: {{ ochami_aarch64_image | join (' ') }} rhel_base_compute_command_options: {{ ochami_base_command | join (' ') }} minio_s3_username: "{{ minio_s3_username }}" minio_s3_password: "{{ minio_s3_password }}" {% set s3_prefix_suffix = '' %} s3_prefix_suffix: "{{ s3_prefix_suffix }}" # Override OpenCHAMI defaults to ensure correct mount path rhel_tag: "{{ rhel_tag }}" rhel_repos: {% set rhel_repo = rhel_aarch64_repos %} {% for repo in rhel_repo %} - { name: '{{ repo.name }}', url: '{{ repo.base_url }}', gpg: '{{ repo.gpg }}' } {% endfor %} base_compute_image_packages: {% for pkg in packages %} - {{ pkg }} {% endfor %} # Commands for this role {% set command_var = functional_group + '_compute_commands' %} {% set commands_list = lookup('vars', command_var, default=[]) %} base_compute_image_commands: {% if commands_list | length > 0 %} {% for 
cmd in commands_list %} - "{{ cmd }}" {% endfor %} {% else %} [] {% endif %} ================================================ FILE: build_image_aarch64/roles/image_creation/vars/main.yml ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. --- input_project_dir: "{{ hostvars['localhost']['input_project_dir'] }}" omnia_metadata_file: "/opt/omnia/.data/oim_metadata.yml" dir_permissions_644: "0644" dir_permissions_755: "0755" aarch64_local_tag: "aarch64-image-builder/ochami" openchami_dir: "/opt/omnia/openchami" openchami_clone_path: /opt/omnia/openchami/deployment-recipes job_retry: "120" job_delay: "30" openchami_work_dir: "{{ oim_shared_path }}/omnia/openchami/workdir" ochami_mounts: - --user 0 --privileged - -v {{ oim_shared_path }}/omnia/pulp/settings/certs/pulp_webserver.crt:/etc/pki/ca-trust/source/anchors/pulp_webserver.crt:z - -v {{ openchami_work_dir }}/images/{{ rhel_aarch64_base_image_name }}-{{ rhel_tag }}.yaml:/home/builder/config.yaml:z ochami_compute_mounts: - --user 0 --privileged - -v {{ oim_shared_path }}/omnia/pulp/settings/certs/pulp_webserver.crt:/etc/pki/ca-trust/source/anchors/pulp_webserver.crt:z - -v {{ openchami_work_dir }}/images/{{ rhel_base_compute_image_name }}-{{ rhel_tag }}.yaml:/home/builder/config.yaml:z ochami_aarch64_image: - --entrypoint /bin/bash - "localhost/{{ aarch64_local_tag }}" ochami_base_command: - -c 'update-ca-trust extract && image-build --config /home/builder/config.yaml --log-level DEBUG' # Usage: build_base_image.yml openchami_log_dir: /opt/omnia/log/openchami openchami_aarch64_base_image_log_path: "{{ openchami_log_dir }}/aarch64_base_image.log" openchami_base_image_vars_template: "{{ role_path }}/templates/base_image_template.j2" openchami_aarch64_base_image_vars_path: "/opt/omnia/openchami/aarch64_base_image_template.yaml" aarch64_inventory_file: "/tmp/temp_ochami_inventory.ini" base_image_failure_msg: | Base aarch64 image build job failed or timed out. Check logs at path {{ openchami_aarch64_base_image_log_path }} for details. compute_image_failure_msg: | aarch64 compute image build job did not complete successfully. Check logs at {{ openchami_log_dir }} for respective functional group for more details. # Usage: build_compute_image.yml openchami_compute_image_vars_template: "{{ role_path }}/templates/compute_images_templates.j2" openchami_compute_image_vars_path: "/opt/omnia/openchami/compute_images_template.yaml" ================================================ FILE: build_image_aarch64/roles/prepare_arm_node/tasks/gather_oim_data.yml ================================================ # Copyright 2025 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. 
# You may obtain a copy of the License at
#
#    http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
---
# Inventory Validation
- name: Fail if no inventory provided
  ansible.builtin.fail:
    msg: "{{ no_inventory_error_msg }}"
  when: groups['all'] | length == 0

- name: Fail if inventory group 'admin_aarch64' is empty
  ansible.builtin.fail:
    msg: "{{ admin_aarch64_empty_error_msg }}"
  when: groups['admin_aarch64'] is not defined or groups['admin_aarch64'] | length == 0

- name: Fail if inventory group 'admin_aarch64' has more than one host
  ansible.builtin.fail:
    msg: "{{ admin_aarch64_count_error_msg }}"
  when: groups['admin_aarch64'] | length != 1

# Validate share option
- name: Set share option fact
  ansible.builtin.set_fact:
    omnia_share_option: "{{ hostvars['localhost']['omnia_share_option'] }}"

- name: Fail if share option is not NFS
  ansible.builtin.fail:
    msg: "{{ nfs_not_configured_msg }}"
  when: omnia_share_option != "NFS"

# Load network specification
- name: Load network spec file
  ansible.builtin.include_vars:
    file: "{{ network_spec }}"
  register: include_network_spec
  no_log: true

- name: Fail if network spec cannot be loaded
  ansible.builtin.fail:
    msg: "{{ network_spec_syntax_fail_msg }} Error: {{ include_network_spec.message }}"
  when: include_network_spec is failed

# Parse network spec data
- name: Parse network spec
  ansible.builtin.set_fact:
    network_data: "{{ network_data | default({}) | combine({item.key: item.value}) }}"
  with_dict: "{{ Networks }}"

# Set PXE IP fact
- name: Set PXE IP fact
  ansible.builtin.set_fact:
    oim_pxe_ip: "{{ network_data.admin_network.primary_oim_admin_ip }}"
    cacheable: true

- name: Create aarch64 directory if not exists
  ansible.builtin.file:
    path: "{{ ochami_aarch_64_dir }}"
    state: directory
    mode: "{{ hostvars['localhost']['dir_permissions_755'] }}"

# Validate pulp.repo existence
- name: Check if pulp.repo exists
  ansible.builtin.stat:
    path: "{{ pulp_repo_file_path }}"
  register: pulp_repo_stat

# Handle missing pulp.repo
- name: Fail if pulp.repo is missing
  ansible.builtin.fail:
    msg: "{{ pulp_repo_missing_error_msg }}"
  when: not pulp_repo_stat.stat.exists

# Read pulp.repo file
- name: Read pulp.repo content
  ansible.builtin.slurp:
    path: "{{ pulp_repo_file_path }}"
  register: pulp_repo_content
  when: pulp_repo_stat.stat.exists

- name: Extract aarch64_baseos repo section
  ansible.builtin.set_fact:
    aarch64_baseos_repo: >-
      {{ (pulp_repo_content.content | b64decode) | regex_search(
        '''(?s)\[aarch64_baseos\].*?(?=\n\[|\Z)''' ) }}
  when: pulp_repo_stat.stat.exists

# Fail if the aarch64_baseos repo is not found
- name: Fail if aarch64_baseos repo section is missing
  ansible.builtin.fail:
    msg: "{{ repo_not_found_error_msg }}"
  when: aarch64_baseos_repo is not defined or aarch64_baseos_repo | length == 0

# Write only the aarch64_baseos repo into the new pulp.repo
- name: Write aarch64_baseos repo into pulp repo path
  ansible.builtin.copy:
    content: "{{ aarch64_baseos_repo }}"
    dest: "{{ pulp_repo_store_path }}"
    mode: "{{ hostvars['localhost']['file_permissions_644'] }}"
  when: aarch64_baseos_repo is defined


================================================ FILE: build_image_aarch64/roles/prepare_arm_node/tasks/main.yml ================================================
# Copyright 2025 Dell Inc.
or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. --- - name: Add target host to known_hosts ansible.builtin.known_hosts: name: "{{ inventory_hostname }}" key: "{{ lookup('pipe', 'ssh-keyscan -H ' + inventory_hostname) }}" delegate_to: localhost - name: Check if passwordless SSH is enabled ansible.builtin.command: cmd: ssh -o BatchMode=yes -o ConnectTimeout=5 root@{{ inventory_hostname }} 'echo OK' register: ssh_check ignore_errors: true changed_when: false delegate_to: localhost # Set up passwordless SSH from localhost if not already enabled - name: Setup passwordless SSH from localhost ansible.builtin.expect: command: "ssh-copy-id -i /root/.ssh/id_rsa.pub root@{{ inventory_hostname }}" responses: "password:": "{{ hostvars['localhost']['provision_password'] }}" when: ssh_check.failed delegate_to: localhost no_log: true - name: Verify passwordless SSH ansible.builtin.command: cmd: ssh -o BatchMode=yes root@{{ inventory_hostname }} 'echo OK' register: ssh_verify failed_when: ssh_verify.stdout != "OK" changed_when: false delegate_to: localhost # Check the machine architecture of the target host - name: Check machine architecture ansible.builtin.command: uname -m register: arch_result changed_when: false # Fail the play if the target machine is not aarch64 - name: Fail if machine is not aarch64 ansible.builtin.fail: msg: "{{ not_aarch64_error_msg }}" when: arch_result.stdout != "aarch64" - name: Remove any existing entries for OIM hostname in /etc/hosts ansible.builtin.lineinfile: path: /etc/hosts regexp: '.*\s+{{ hostvars["localhost"]["oim_hostname"] }}$' state: absent changed_when: true - name: Add correct OIM PXE IP and hostname to /etc/hosts ansible.builtin.lineinfile: path: /etc/hosts line: "{{ hostvars['localhost']['oim_pxe_ip'] }} {{ hostvars['localhost']['oim_hostname'] }}" state: present mode: "{{ hostvars['localhost']['file_permissions_644'] }}" create: true # Verify the entry exists in /etc/hosts - name: Verify OIM PXE IP and hostname in /etc/hosts ansible.builtin.command: cmd: "grep {{ hostvars['localhost']['oim_pxe_ip'] }} /etc/hosts" register: etc_hosts_check changed_when: false failed_when: etc_hosts_check.stdout == "" - name: Display verification result ansible.builtin.debug: msg: "Entry in /etc/hosts: {{ etc_hosts_check.stdout }}" - name: Ping OIM hostname from target host ansible.builtin.raw: "ping -c 2 {{ hostvars['localhost']['oim_hostname'] }}" register: ping_result changed_when: false failed_when: ping_result.rc != 0 - name: Show ping result ansible.builtin.debug: msg: "{{ ping_result.stdout }}" # Register NFS details - name: Set NFS info fact ansible.builtin.set_fact: nfs_info: server_ip: "{{ hostvars['localhost']['nfs_server_ip'] }}" server_share_path: "{{ hostvars['localhost']['nfs_server_share_path'] }}" shared_path: "{{ hostvars['localhost']['oim_shared_path'] }}" - name: Ensure NFS mount point directory exists ansible.builtin.file: path: "{{ nfs_info.shared_path }}" state: directory mode: "{{ hostvars['localhost']['dir_permissions_755'] }}" 
become: true - name: Copy pulp.repo from omnia_core to target host ansible.builtin.copy: src: "{{ pulp_repo_store_path }}" dest: "{{ pulp_repo_file_path }}" mode: "{{ hostvars['localhost']['file_permissions_644'] }}" - name: Copy pulp webserver certificate to target host ansible.builtin.copy: src: "{{ pulp_webserver_cert_path }}" dest: "{{ anchors_path }}" mode: "{{ hostvars['localhost']['file_permissions_644'] }}" become: true - name: Update CA trust on target host ansible.builtin.command: update-ca-trust register: update_ca changed_when: false - name: Check if NFS is mounted ansible.builtin.command: cmd: "mountpoint -q {{ nfs_info.shared_path }}" register: nfs_mounted ignore_errors: true changed_when: false # Install NFS client package - name: Install NFS client package ansible.builtin.dnf: name: nfs-utils state: present when: nfs_mounted.rc != 0 become: true # Mount NFS share if not mounted - name: Mount NFS share ansible.builtin.mount: path: "{{ nfs_info.shared_path }}" src: "{{ nfs_info.server_ip }}:{{ nfs_info.server_share_path }}" fstype: nfs opts: defaults state: mounted when: nfs_mounted.rc != 0 become: true # Verify the mount - name: Verify NFS mount ansible.builtin.command: cmd: "mountpoint -q {{ nfs_info.shared_path }}" register: verify_nfs failed_when: verify_nfs.rc != 0 changed_when: false - name: Display NFS mount status ansible.builtin.debug: msg: "NFS share {{ nfs_info.server_ip }}:{{ nfs_info.server_share_path }} is mounted on {{ nfs_info.shared_path }}" - name: Build full Podman image path ansible.builtin.set_fact: pulp_aarch_image: "{{ hostvars['localhost']['oim_pxe_ip'] }}:2225/{{ pulp_aarch64_image_name }}" - name: Pull and tag aarch64 image block: - name: Pull aarch64 image using Podman containers.podman.podman_image: name: "{{ pulp_aarch_image }}" state: present register: podman_pull_result retries: "{{ pull_image_retries }}" delay: "{{ pull_image_delay }}" until: podman_pull_result is not failed changed_when: false - name: Tag pulled image containers.podman.podman_tag: image: "{{ pulp_aarch_image }}" target_names: - "{{ aarch64_local_tag }}" changed_when: false rescue: - name: Fail if Podman pull failed ansible.builtin.fail: msg: "Failed to pull image {{ pulp_aarch_image }}" - name: Check if regctl binary exists ansible.builtin.stat: path: "{{ ochami_aarch_64_dir }}/regctl" register: regctl_stat delegate_to: localhost - name: Fail if regctl binary not found ansible.builtin.fail: msg: "{{ regctl_not_found_msg }}" when: not regctl_stat.stat.exists - name: Copy regctl binary to /usr/local/bin on target host ansible.builtin.copy: src: "{{ ochami_aarch_64_dir }}/regctl" dest: "{{ regctl_bin_path }}" mode: "{{ hostvars['localhost']['dir_permissions_755'] }}" become: true - name: Set registry TLS option using regctl ansible.builtin.command: "{{ regctl_bin_path }} registry set --tls disabled {{ hostvars['localhost']['oim_hostname'] }}:5000" register: regctl_result changed_when: regctl_result.rc == 0 become: true ================================================ FILE: build_image_aarch64/roles/prepare_arm_node/vars/main.yml ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. 
# You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. --- # input files input_project_dir: "{{ hostvars['localhost']['input_project_dir'] }}" pulp_aarch64_image_name: "dellhpcomniaaisolution/image-build-aarch64:1.1" aarch64_local_tag: "aarch64-image-builder/ochami" pull_image_retries: "3" pull_image_delay: "10" network_spec: "{{ input_project_dir }}/network_spec.yml" ochami_aarch_64_dir: "/opt/omnia/openchami/aarch64" pulp_repo_store_path: "{{ ochami_aarch_64_dir }}/pulp.repo" pulp_repo_file_path: "/etc/yum.repos.d/pulp.repo" pulp_webserver_cert_path: "/opt/omnia/pulp/settings/certs/pulp_webserver.crt" anchors_path: "/etc/pki/ca-trust/source/anchors/pulp_webserver.crt" regctl_bin_path: "/usr/local/bin/regctl" # Error messages no_inventory_error_msg: "No inventory provided. Please specify an inventory with -i option." admin_aarch64_empty_error_msg: "The inventory group 'admin_aarch64' does not exist or has no hosts." admin_aarch64_count_error_msg: "The inventory group 'admin_aarch64' must have exactly one host." network_spec_syntax_fail_msg: "Failed to load network_spec.yml due to syntax error" pulp_repo_missing_error_msg: "pulp.repo file not found. Please run local_repo.yml playbook to create a repo file." not_aarch64_error_msg: "This is not an aarch64 machine. Only ARM nodes can be used to build the image." repo_not_found_error_msg: "The aarch64_baseos repo section is not available in pulp.repo" nfs_not_configured_msg: > To build aarch64 images on an ARM node, the NFS server must be configured on the OIM. Please run oim_cleanup.yml and reinstall the omnia_core container with the NFS option. aarch64_image_fail_msg: > Unable to pull the Ochami aarch64 image builder image. Make sure you have added the default package for aarch64 in the software_config.json file and ran local_repo.yml. If not, add that package and rerun local_repo.yml. regctl_not_found_msg: > regctl binary not found at {{ ochami_aarch_64_dir }}/regctl. Please run prepare_oim.yml playbook to download the regctl binary. ================================================ FILE: build_image_x86_64/ansible.cfg ================================================ [defaults] log_path = /opt/omnia/log/core/playbooks/build_image_x86_64.yml remote_tmp = /opt/omnia/tmp/.ansible/tmp/ host_key_checking = false forks = 5 timeout = 180 executable = /bin/bash library = ../common/library/modules module_utils = ../common/library/module_utils [persistent_connection] command_timeout = 180 connect_timeout = 180 [ssh_connection] retries = 3 ssh_args = -o ControlMaster=auto -o ControlPersist=60 -o ConnectTimeout=60 ================================================ FILE: build_image_x86_64/build_image_x86_64.yml ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. 
# You may obtain a copy of the License at
#
#    http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
---
- name: Check if upgrade is in progress
  ansible.builtin.import_playbook: ../utils/upgrade_checkup.yml

- name: Set fact for fetching omnia config credentials
  hosts: localhost
  connection: local
  tags: always
  tasks:
    - name: Set dynamic run tags including 'build_image'
      when: not config_file_status | default(false) | bool
      ansible.builtin.set_fact:
        omnia_run_tags: "{{ (ansible_run_tags | default([]) + ['build_image']) | unique }}"
        cacheable: true

- name: Invoke validate_config.yml to perform L1 and L2 validations with build_image tag
  ansible.builtin.import_playbook: ../input_validation/validate_config.yml
  tags: always

- name: Invoke get_config_credentials.yml
  ansible.builtin.import_playbook: ../utils/credential_utility/get_config_credentials.yml

- name: Include input project directory
  when: not project_dir_status | default(false) | bool
  ansible.builtin.import_playbook: ../utils/include_input_dir.yml
  vars:
    openchami_vars_suppport: true
    omnia_metadata_support: true

- name: Load build_stream configuration
  hosts: localhost
  connection: local
  gather_facts: false
  tags: always
  tasks:
    - name: Include build_stream config file
      ansible.builtin.include_vars:
        file: "{{ input_project_dir }}/build_stream_config.yml"
      failed_when: false

    - name: Set build_stream variables from extra_vars
      ansible.builtin.set_fact:
        build_stream_job_id: "{{ job_id | default('') }}"
        build_stream_image_key: "{{ image_key | default('') }}"
        build_stream_functional_groups: "{{ functional_groups | default([]) }}"
        enable_build_stream_flag: "{{ enable_build_stream | default(false) | bool }}"

    - name: Debug - Show build_stream variables
      ansible.builtin.debug:
        msg:
          - "build_stream_job_id: {{ build_stream_job_id }}"
          - "build_stream_image_key: {{ build_stream_image_key }}"
          - "build_stream_functional_groups: {{ build_stream_functional_groups }}"
          - "enable_build_stream_flag: {{ enable_build_stream_flag }}"
        verbosity: 2

    - name: Fetch build_stream prerequisites
      ansible.builtin.include_role:
        name: fetch_packages
        tasks_from: build_stream_prerequisite.yml
      vars:
        job_id: "{{ build_stream_job_id }}"
        image_key: "{{ build_stream_image_key }}"
        functional_groups: "{{ build_stream_functional_groups }}"
        enable_build_stream: "{{ enable_build_stream_flag }}"
      when: enable_build_stream_flag

- name: Create oim group and provision group
  ansible.builtin.import_playbook: ../utils/create_container_group.yml
  vars:
    oim_group: true
  tags: always

- name: Configure auth for OpenCHAMI
  hosts: oim
  connection: ssh
  tasks:
    - name: OpenCHAMI cluster authentication
      ansible.builtin.include_tasks: "{{ playbook_dir }}/../common/tasks/common/openchami_auth.yml"
      vars:
        oim_node_name: "{{ hostvars['localhost']['oim_node_name'] }}"

- name: Generate functional groups configuration when enable_build_stream is false
  ansible.builtin.import_playbook: ../utils/generate_functional_groups.yml
  tags: always
  when: not enable_build_stream

- name: Verify x86_64 functional_group present
  hosts: localhost
  connection: local
  tasks:
    - name: Fetch x86_64 functional_groups
      ansible.builtin.include_role:
        name: fetch_packages
        tasks_from: check_x86_64_fg.yml
      when: not enable_build_stream

- name: Fetch packages for
x86_64 hosts: localhost connection: local gather_facts: false roles: - fetch_packages - name: Tagging OpenCHAMI image hosts: oim connection: ssh tasks: - name: Tag OpenCHAMI image ansible.builtin.include_role: name: image_creation tasks_from: prepare_pulp_image.yml - name: OpenCHAMI build image for x86_64 hosts: localhost connection: local gather_facts: false roles: - image_creation - name: Build x86_64 image completion hosts: localhost connection: local tasks: - name: Build Image completion ansible.builtin.include_role: name: fetch_packages tasks_from: x86_64_build_image_completion.yml ================================================ FILE: build_image_x86_64/roles/fetch_packages/tasks/build_stream_prerequisite.yml ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. --- - name: Debug - Show explicitly passed variables ansible.builtin.debug: msg: - "job_id: {{ job_id | default('NOT_SET') }}" - "image_key: {{ image_key | default('NOT_SET') }}" - "functional_groups: {{ functional_groups | default('NOT_SET') }}" - "enable_build_stream: {{ enable_build_stream | default('NOT_SET') }}" verbosity: 2 - name: Set build_stream variables from explicitly passed values ansible.builtin.set_fact: build_stream_job_id: "{{ job_id }}" image_key: "{{ image_key }}" cacheable: true - name: Normalize functional_groups input into list ansible.builtin.set_fact: functional_group_list: "{{ functional_groups if functional_groups is iterable and functional_groups is not string else (functional_groups | from_yaml) }}" when: functional_groups is defined and enable_build_stream - name: Fail when build stream enabled without job id or functional groups ansible.builtin.fail: msg: "{{ build_stream_prerequisite_fail_msg }}" when: - enable_build_stream | bool - (build_stream_job_id | default('') | string) | length == 0 or (functional_group_list | default([]) | length == 0) or (image_key | default('') | string) | length == 0 # noqa: yaml[line-length] ================================================ FILE: build_image_x86_64/roles/fetch_packages/tasks/check_x86_64_fg.yml ================================================ # Copyright 2025 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
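# Note (illustrative, hypothetical group names): given a functional_groups_config.yml
# such as
#   functional_groups:
#     - name: compute_x86_64
#     - name: login_aarch64
# the selectattr('name', 'search', '_x86_64$') filter below matches one entry, so
# fg_x86_64 evaluates to true; if no *_x86_64 group exists, the role fails with
# functional_group_absent_msg.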
--- - name: Load functional_group_config.yml ansible.builtin.include_vars: file: "{{ functional_groups_config_path }}" name: functional_group_cfg - name: Check for x86_64 functional groups ansible.builtin.set_fact: fg_x86_64: >- {{ functional_group_cfg.functional_groups | selectattr('name', 'search', '_x86_64$') | list | length > 0 }} cacheable: true - name: Fail if x86_64 functional groups are not present ansible.builtin.fail: msg: "{{ functional_group_absent_msg.splitlines() | join(' ') }}" when: not fg_x86_64 ================================================ FILE: build_image_x86_64/roles/fetch_packages/tasks/fetch_packages.yml ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. --- - name: Fetch x86_64 default_packages.json and additional_packages.json software packages block: - name: Collect base image RPM packages (default + additional + admin_debug) base_image_package_collector: default_json_path: "{{ default_json_path }}" additional_json_path: "{{ additional_json_path | default('') }}" admin_debug_json_path: "{{ admin_debug_json_path | default('') }}" software_config_path: "{{ software_config_file_path }}" register: base_image_output - name: Set x86_64_base_image_packages ansible.builtin.set_fact: x86_64_base_image_packages: "{{ base_image_output.base_image_packages }}" - name: Debug package x86_64_base_image_packages ansible.builtin.debug: var: x86_64_base_image_packages verbosity: 2 - name: Parse functional_group_config.yml to list functional_group_parser: functional_groups_file: "{{ functional_groups_file_path }}" register: functional_group_parser_list when: not enable_build_stream - name: Set fact for functional_group_list ansible.builtin.set_fact: functional_group_list: "{{ functional_group_parser_list.functional_groups }}" when: not enable_build_stream - name: Debug full functional group parser output ansible.builtin.debug: var: functional_group_list verbosity: 2 - name: Read packages for compute image softwares image_package_collector: functional_groups: "{{ functional_group_list }}" software_config_file: "{{ software_config_file_path }}" input_project_dir: "{{ input_project_dir }}" additional_json_path: "{{ additional_json_path }}" register: compute_images_output - name: Save packages for x86_64 keys in compute_images_dict ansible.builtin.set_fact: compute_images_dict: >- {{ compute_images_output.compute_images_dict | dict2items | selectattr('key', 'search', '_x86_64$') | items2dict }} - name: Debug software directory compute_images_dict ansible.builtin.debug: var: compute_images_dict verbosity: 2 ================================================ FILE: build_image_x86_64/roles/fetch_packages/tasks/fetch_pulp_repos.yml ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. 
# You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. --- - name: Fetch pulp endpoints when x86_64 build_stream enabled block: - name: Fetch pulp endpoints for x86_64 ansible.builtin.command: > pulp rpm distribution list --field name,base_url register: pulp_endpoints changed_when: false - name: Filter only x86_64 distributions ansible.builtin.set_fact: pulp_x86_64_distributions: >- {{ pulp_endpoints.stdout | from_json | selectattr('name', 'match', '^x86_64') | list }} - name: Build rhel_repos list from pulp_x86_64_distributions ansible.builtin.set_fact: rhel_x86_64_repos: >- {{ pulp_x86_64_distributions | map('combine', {'gpg': ''}) | list }} - name: Debug rhel_x86_64_repos ansible.builtin.debug: msg: "{{ rhel_x86_64_repos | to_nice_yaml(indent=2) }}" verbosity: 2 ================================================ FILE: build_image_x86_64/roles/fetch_packages/tasks/main.yml ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
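# Note (illustrative): the default/additional/admin_debug JSON paths set below are
# derived from software_config.json. With a hypothetical cluster_os_type of "rhel"
# and cluster_os_version of "9.4", the default packages file would resolve to
#   <input_project_dir>/config/x86_64/rhel/9.4/default_packages.json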
--- - name: Check local_repo.yml execution block: - name: Check if metadata file exists ansible.builtin.stat: path: "{{ metadata_file_path }}" register: metadata_file_status - name: Fail if metadata file is not present ansible.builtin.fail: msg: "{{ local_repo_check_msg }}" when: not metadata_file_status.stat.exists - name: Initialize fg_x86_64 as false ansible.builtin.set_fact: fg_x86_64: "{{ fg_x86_64 | default(false) }}" when: enable_build_stream | default(false) - name: Include functional groups config ansible.builtin.include_vars: file: "{{ functional_groups_file_path }}" name: functional_groups_config when: not enable_build_stream - name: Set functional_groups_file_path for build_stream disabled flow ansible.builtin.set_fact: functional_groups_file_path: "{{ functional_groups_file_path }}" when: not enable_build_stream - name: Include software config ansible.builtin.include_vars: file: "{{ software_config_file_path }}" name: software_config when: enable_build_stream | default(false) - name: Set cluster OS facts ansible.builtin.set_fact: rhel_tag: "{{ software_config.cluster_os_version }}" default_json_path: "{{ input_project_dir }}/config/x86_64/{{ software_config.cluster_os_type }}/{{ software_config.cluster_os_version }}/default_packages.json" # noqa: yaml[line-length] additional_json_path: "{{ input_project_dir }}/config/x86_64/{{ software_config.cluster_os_type }}/{{ software_config.cluster_os_version }}/additional_packages.json" # noqa: yaml[line-length] admin_debug_json_path: "{{ input_project_dir }}/config/x86_64/{{ software_config.cluster_os_type }}/{{ software_config.cluster_os_version }}/admin_debug_packages.json" # noqa: yaml[line-length] - name: Fetch pulp endpoint repos ansible.builtin.include_tasks: fetch_pulp_repos.yml when: fg_x86_64 or enable_build_stream - name: Fetch packages for base and compute image softwares ansible.builtin.include_tasks: fetch_packages.yml when: fg_x86_64 or enable_build_stream ================================================ FILE: build_image_x86_64/roles/fetch_packages/tasks/x86_64_build_image_completion.yml ================================================ # Copyright 2025 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. --- - name: Build Image completion ansible.builtin.debug: msg: "{{ x86_64_build_image_completion_msg.splitlines() | join(' ') }}" ================================================ FILE: build_image_x86_64/roles/fetch_packages/vars/main.yml ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 
# See the License for the specific language governing permissions and # limitations under the License. --- metadata_file_path: "/opt/omnia/offline_repo/.data/localrepo_metadata.yml" local_repo_check_msg: | Failure: metadata file path {{ metadata_file_path }} is not present. Please make sure that local_repo.yml playbook is executed successfully. input_project_dir: "{{ hostvars['localhost']['input_project_dir'] }}" functional_groups_file_path: "{{ hostvars['localhost']['functional_groups_config_path'] | default('/opt/omnia/.data/functional_groups_config.yml') }}" software_config_file_path: "{{ input_project_dir }}/software_config.json" x86_64_build_image_completion_msg: | The playbook build_image_x86_64.yml has been completed successfully. To boot x86_64 nodes execute discovery/discovery.yml playbook. To build image for aarch64 nodes execute build_image_aarch64/build_image_aarch64.yml playbook. functional_group_absent_msg: | Failure: No x86_64 functional groups found in functional_group_config.yml input file. Please make sure x86_64 functional_group should be present in input file functional_group_config.yml to execute build_image_x86_64.yml successfully. build_stream_prerequisite_fail_msg: | Build Stream mode is enabled. Manual execution is not supported. Please trigger this workflow via the GitLab pipeline. ================================================ FILE: build_image_x86_64/roles/image_creation/tasks/build_base_image.yml ================================================ # Copyright 2025 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
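# Note (illustrative, hypothetical values): when enable_build_stream is true and both
# build_stream_job_id and image_key are non-empty, the base image name is suffixed.
# For example, with rhel_x86_64_base_image_name "rhel-base-x86_64",
# build_stream_job_id "1042" and image_key "hpc", the tasks below would build
# "rhel-base-x86_64_1042-hpc"; otherwise the unsuffixed default name is used.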
--- - name: Normalize build stream inputs for base image ansible.builtin.set_fact: enable_build_stream: "{{ enable_build_stream | default(false) | bool }}" build_stream_job_id: "{{ build_stream_job_id | default('') }}" image_key: "{{ image_key | default('') }}" base_image_suffix: "" - name: Set base image suffix when build stream inputs present ansible.builtin.set_fact: base_image_suffix: "_{{ build_stream_job_id }}-{{ image_key | default('') }}" rhel_base_image_name: "{{ rhel_x86_64_base_image_name }}_{{ build_stream_job_id }}-{{ image_key | default('') }}" when: - enable_build_stream | bool - (build_stream_job_id | default('') | length) > 0 - (image_key | default('') | length) > 0 - name: Create x86_64_base_image.log as a file ansible.builtin.file: path: "{{ openchami_x86_64_base_image_log_path }}" state: touch mode: "{{ dir_permissions_644 }}" - name: Load the openchami image vars ansible.builtin.template: src: "{{ openchami_base_image_vars_template }}" dest: "{{ openchami_x86_64_base_image_vars_path }}" mode: "{{ dir_permissions_644 }}" - name: Invoking Openchami playbook for rhel-base image build ansible.builtin.shell: | set -o pipefail ansible-playbook {{ openchami_clone_path }}/dell/podman-quadlets/image.yaml \ -i {{ openchami_clone_path }}/dell/podman-quadlets/inventory -v \ --extra-vars "@{{ openchami_x86_64_base_image_vars_path }}" \ --tags base_image -v | \ /usr/bin/tee {{ openchami_x86_64_base_image_log_path }} async: 3600 # Set async timeout (e.g., 1 hour) poll: 0 # Non-blocking (continue the playbook without waiting for completion) register: base_image_build changed_when: true - name: Wait for rhel-base image OpenCHAMI jobs to finish block: - name: Wait for rhel-base image OpenCHAMI jobs to finish ansible.builtin.async_status: jid: "{{ base_image_build.ansible_job_id }}" register: job_result until: job_result.finished retries: "{{ job_retry }}" delay: "{{ job_delay }}" rescue: - name: Fail the build if the base image build fails ansible.builtin.fail: msg: | {{ base_image_failure_msg }} always: - name: Remove generated base image vars file ansible.builtin.file: path: "{{ openchami_x86_64_base_image_vars_path }}" state: absent - name: Set openchami SELinux context ansible.builtin.command: chcon -R system_u:object_r:container_file_t:s0 "{{ oim_shared_path }}/omnia/openchami" changed_when: true delegate_to: oim connection: ssh failed_when: false ================================================ FILE: build_image_x86_64/roles/image_creation/tasks/build_compute_image.yml ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
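# Note (illustrative, hypothetical values): compute_images_dict comes from the
# fetch_packages role and might look like
#   compute_images_dict:
#     slurm_compute_x86_64:
#       functional_group: slurm_compute
#       packages: [kernel-devel, vim]
# Each key below gets its own rendered <key><compute_image_suffix>_compute_images.yaml
# vars file, its own log file under openchami_log_dir, and one asynchronous OpenCHAMI
# build job that is later polled with async_status.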
--- - name: Normalize build stream inputs ansible.builtin.set_fact: enable_build_stream: "{{ enable_build_stream | default(false) | bool }}" build_stream_job_id: "{{ build_stream_job_id | default('') }}" image_key: "{{ image_key | default('') }}" compute_image_suffix: "" - name: Set compute image suffix when build stream inputs present ansible.builtin.set_fact: compute_image_suffix: "_{{ build_stream_job_id }}-{{ image_key | default('') }}" when: - enable_build_stream | bool - (build_stream_job_id | default('') | length) > 0 - (image_key | default('') | length) > 0 - name: Create x86_64 compute image log files ansible.builtin.file: path: "{{ openchami_log_dir }}/{{ item.key }}{{ compute_image_suffix }}_compute_image.log" state: touch mode: "{{ dir_permissions_644 }}" loop: "{{ compute_images_dict | dict2items }}" loop_control: loop_var: item - name: Render compute images templates ansible.builtin.template: src: "{{ openchami_compute_image_vars_template }}" dest: "{{ openchami_dir }}/{{ item.key }}{{ compute_image_suffix }}_compute_images.yaml" mode: "{{ dir_permissions_644 }}" vars: functional_group: "{{ item.value.functional_group }}" packages: "{{ item.value.packages }}" # Pre-compute image names to avoid undefined errors inside template base_compute_image_name: "{{ item.key }}{{ compute_image_suffix }}" rhel_base_compute_image_name: "rhel-{{ item.key }}{{ compute_image_suffix }}" loop: "{{ compute_images_dict | dict2items }}" loop_control: loop_var: item - name: Invoking OpenCHAMI playbooks asynchronously for x86_64 compute image_build ansible.builtin.shell: | set -o pipefail ansible-playbook {{ openchami_clone_path }}/dell/podman-quadlets/image.yaml \ -i {{ openchami_clone_path }}/dell/podman-quadlets/inventory -v \ --extra-vars '@{{ openchami_dir }}/{{ item.key }}{{ compute_image_suffix }}_compute_images.yaml' \ --tags compute_image -v | \ /usr/bin/tee '{{ openchami_log_dir }}/{{ item.key }}{{ compute_image_suffix }}_compute_image.log' async: 3600 # Set async timeout (e.g., 1 hour) poll: 0 # Non-blocking (continue the playbook without waiting for completion) loop: "{{ compute_images_dict | dict2items }}" loop_control: loop_var: item register: compute_image_build_job changed_when: true - name: Wait for all OpenCHAMI jobs to finish and remove generated compute images templates block: - name: Display image build jobs status ansible.builtin.debug: msg: "Waiting for image build: {{ item.item.key }} (Job ID: {{ item.ansible_job_id }})" loop: "{{ compute_image_build_job.results }}" loop_control: label: "{{ item.item.key }}" - name: Wait for all OpenCHAMI jobs to finish ansible.builtin.async_status: jid: "{{ item.ansible_job_id }}" register: job_result until: job_result.finished no_log: true retries: "{{ job_retry }}" delay: "{{ job_delay }}" loop: "{{ compute_image_build_job.results }}" loop_control: label: "Building: {{ item.item.key }}" rescue: - name: Identify failed image builds ansible.builtin.set_fact: failed_images: > {{ job_result.results | selectattr('failed', 'defined') | selectattr('failed', 'equalto', true) | map(attribute='item.item.key') | list }} when: job_result.results is defined - name: Build failure message list ansible.builtin.set_fact: failure_msg_list: - "x86_64 compute image build job did not complete successfully." - "Check logs at {{ openchami_log_dir }} for respective functional group for more details." 
- "" - "Failed images:" - name: Add failed image names to message ansible.builtin.set_fact: failure_msg_list: "{{ failure_msg_list + [' - ' + item] }}" loop: "{{ failed_images | default(['Unknown - check all logs']) }}" - name: Add log paths section to message ansible.builtin.set_fact: failure_msg_list: "{{ failure_msg_list + ['', 'Check logs at ' + openchami_log_dir + ' for details:'] }}" - name: Add log file paths to message ansible.builtin.set_fact: failure_msg_list: "{{ failure_msg_list + [' - ' + openchami_log_dir + '/' + item + log_suffix + '_compute_image.log'] }}" vars: log_suffix: "{{ compute_image_suffix }}" loop: "{{ failed_images | default([]) }}" - name: Display x86_64 compute image build failure details ansible.builtin.debug: msg: "{{ failure_msg_list }}" - name: Failed to build the x86_64 compute image ansible.builtin.fail: msg: "x86_64 compute image build failed. See details above." always: - name: Remove generated compute images templates ansible.builtin.file: path: "{{ openchami_dir }}/{{ item.key }}{{ compute_image_suffix }}_compute_images.yaml" state: absent loop: "{{ compute_images_dict | dict2items }}" loop_control: loop_var: item - name: Set openchami SELinux context ansible.builtin.command: chcon -R system_u:object_r:container_file_t:s0 "{{ oim_shared_path }}/omnia/openchami" changed_when: true delegate_to: oim connection: ssh failed_when: false ================================================ FILE: build_image_x86_64/roles/image_creation/tasks/main.yml ================================================ # Copyright 2025 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. --- - name: Include metadata vars ansible.builtin.include_vars: "{{ omnia_metadata_file }}" register: include_metadata no_log: true - name: Include global variables from common folder ansible.builtin.include_vars: "{{ role_path }}/../../../common/vars/openchami_image_cmd.yml" register: ochami_image_global_vars - name: Invoking x86_64 build base image playbook ansible.builtin.include_tasks: build_base_image.yml tags: base_image - name: Invoking x86_64 build rhel compute image playbooks ansible.builtin.include_tasks: build_compute_image.yml tags: compute_image ================================================ FILE: build_image_x86_64/roles/image_creation/tasks/prepare_pulp_image.yml ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
--- # Load network specification - name: Load network spec file ansible.builtin.include_vars: file: "{{ network_spec }}" register: include_network_spec no_log: true - name: Fail if network spec cannot be loaded ansible.builtin.fail: msg: "{{ network_spec_syntax_fail_msg }} Error: {{ include_network_spec.message }}" when: include_network_spec is failed # Parse network spec data - name: Parse network spec ansible.builtin.set_fact: network_data: "{{ network_data | default({}) | combine({item.key: item.value}) }}" with_dict: "{{ Networks }}" # Set PXE IP fact - name: Set PXE IP fact ansible.builtin.set_fact: oim_pxe_ip: "{{ network_data.admin_network.primary_oim_admin_ip }}" cacheable: true # Copy pulp certificate and update CA trust - name: Copy pulp webserver certificate to anchors ansible.builtin.copy: src: "{{ pulp_webserver_cert_path }}" dest: "{{ anchors_path }}" mode: "{{ dir_permissions_644 }}" become: true - name: Update CA trust ansible.builtin.command: update-ca-trust register: update_ca changed_when: false - name: Build full Podman image path for x86_64 ansible.builtin.set_fact: pulp_x86_image: "{{ oim_pxe_ip }}:2225/{{ pulp_x86_64_image_name }}" - name: Pull and tag x86_64 image block: - name: Pull x86_64 image using Podman containers.podman.podman_image: name: "{{ pulp_x86_image }}" state: present register: pull_result retries: "{{ pull_image_retries }}" delay: "{{ pull_image_delay }}" until: pull_result is not failed changed_when: false - name: Tag pulled image for x86_64 build containers.podman.podman_tag: image: "{{ pulp_x86_image }}" target_names: - "{{ x86_64_local_tag }}" changed_when: false rescue: - name: Fail if Podman pull failed ansible.builtin.fail: msg: "Failed to pull image {{ pulp_x86_image }}." ================================================ FILE: build_image_x86_64/roles/image_creation/templates/base_image_template.j2 ================================================ openchami_work_dir: "{{ openchami_work_dir }}" rhel_base_image_name: "{{ rhel_x86_64_base_image_name }}" rhel_base_image: "{{ oim_node_name }}/{{ rhel_x86_64_base_image_name }}" cluster_name: "{{ oim_node_name }}" cluster_domain: "{{ domain_name }}" group_name: base rhel_base_mounts: {{ ochami_mounts | join(' ') }} image_build_name: {{ ochami_x86_64_image | join(' ') }} rhel_base_command_options: {{ ochami_base_command | join(' ') }} # Override OpenCHAMI defaults to ensure correct mount path rhel_tag: "{{ rhel_tag }}" rhel_repos: {% for repo in rhel_x86_64_repos %} - { name: '{{ repo.name }}', url: '{{ repo.base_url }}', gpg: '{{ repo.gpg }}' } {% endfor %} base_image_packages: {% for pkg in x86_64_base_image_packages %} - {{ pkg }} {% endfor %} base_image_commands: {% for cmd in base_image_commands %} - {{ cmd | to_json }} {% endfor %} ================================================ FILE: build_image_x86_64/roles/image_creation/templates/compute_images_templates.j2 ================================================ openchami_work_dir: "{{ openchami_work_dir }}" rhel_base_image: "{{ oim_node_name }}/{{ rhel_x86_64_base_image_name }}" {% set image_name_suffix = compute_image_suffix | default('') %} base_compute_image_name: "{{ item.key }}{{ image_name_suffix }}" rhel_base_compute_image_name: "rhel-{{ item.key }}{{ image_name_suffix }}" rhel_base_compute_image: "{{ oim_node_name }}/rhel-{{ item.key }}{{ image_name_suffix }}" # S3 directory should stay stable (no job-id) while the filename will carry job-id via image name s3_dir_name: "rhel-{{ item.key }}" cluster_name: "{{ oim_node_name }}" 
cluster_domain: "{{ domain_name }}" group_name: "{{ item.key }}" rhel_base_compute_mounts: --user 0 --privileged -v {{ oim_shared_path }}/omnia/pulp/settings/certs/pulp_webserver.crt:/etc/pki/ca-trust/source/anchors/pulp_webserver.crt:z -v {{ openchami_work_dir }}/images/{{ rhel_base_compute_image_name }}-{{ rhel_tag }}.yaml:/home/builder/config.yaml:z image_build_name: {{ ochami_x86_64_image | join (' ') }} rhel_base_compute_command_options: {{ ochami_base_command | join (' ') }} minio_s3_username: "{{ minio_s3_username }}" minio_s3_password: "{{ minio_s3_password }}" {% set s3_prefix_suffix = '' %} s3_prefix_suffix: "{{ s3_prefix_suffix }}" # Override OpenCHAMI defaults to ensure correct mount path rhel_tag: "{{ rhel_tag }}" rhel_repos: {% set rhel_repo = rhel_x86_64_repos %} {% for repo in rhel_repo %} - { name: '{{ repo.name }}', url: '{{ repo.base_url }}', gpg: '{{ repo.gpg }}' } {% endfor %} base_compute_image_packages: {% for pkg in packages %} - {{ pkg }} {% endfor %} # Commands for this role {% set command_var = functional_group + '_compute_commands' %} {% set commands_list = lookup('vars', command_var, default=[]) %} base_compute_image_commands: {% if commands_list | length > 0 %} {% for cmd in commands_list %} - "{{ cmd }}" {% endfor %} {% else %} [] {% endif %} ================================================ FILE: build_image_x86_64/roles/image_creation/vars/main.yml ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
--- pulp_x86_64_image_name: "dellhpcomniaaisolution/image-build-el10:1.1" x86_64_local_tag: "x86_64-image-builder/ochami" pull_image_retries: "3" pull_image_delay: "10" input_project_dir: "{{ hostvars['localhost']['input_project_dir'] }}" omnia_metadata_file: "/opt/omnia/.data/oim_metadata.yml" dir_permissions_644: "0644" dir_permissions_755: "0755" openchami_dir: "/opt/omnia/openchami" openchami_clone_path: /opt/omnia/openchami/deployment-recipes job_retry: "120" job_delay: "30" network_spec: "{{ input_project_dir }}/network_spec.yml" pulp_webserver_cert_path: "/opt/omnia/pulp/settings/certs/pulp_webserver.crt" anchors_path: "/etc/pki/ca-trust/source/anchors/pulp_webserver.crt" openchami_work_dir: "{{ oim_shared_path }}/omnia/openchami/workdir" ochami_mounts: - --user 0 --privileged - -v {{ oim_shared_path }}/omnia/pulp/settings/certs/pulp_webserver.crt:/etc/pki/ca-trust/source/anchors/pulp_webserver.crt:z - -v {{ openchami_work_dir }}/images/{{ rhel_x86_64_base_image_name }}-{{ rhel_tag }}.yaml:/home/builder/config.yaml:z ochami_compute_mounts: - --user 0 --privileged - -v {{ oim_shared_path }}/omnia/pulp/settings/certs/pulp_webserver.crt:/etc/pki/ca-trust/source/anchors/pulp_webserver.crt:z - -v {{ openchami_work_dir }}/images/{{ rhel_base_compute_image_name }}-{{ rhel_tag }}.yaml:/home/builder/config.yaml:z ochami_x86_64_image: - --entrypoint /bin/bash - "localhost/{{ x86_64_local_tag }}" ochami_base_command: - -c 'update-ca-trust extract && image-build --config /home/builder/config.yaml --log-level DEBUG' # build_base_image.yml openchami_log_dir: /opt/omnia/log/openchami openchami_x86_64_base_image_log_path: "{{ openchami_log_dir }}/x86_64_base_image.log" openchami_base_image_vars_template: "{{ role_path }}/templates/base_image_template.j2" openchami_x86_64_base_image_vars_path: "/opt/omnia/openchami/x86_64_base_image_template.yaml" base_image_failure_msg: | Base x86_64 image build job failed or timed out. Check logs at path {{ openchami_x86_64_base_image_log_path }} for details. compute_image_failure_msg: | x86_64 compute image build job did not complete successfully. Check logs at {{ openchami_log_dir }} for respective functional group for more details. # build_compute_image.yml openchami_compute_image_vars_template: "{{ role_path }}/templates/compute_images_templates.j2" openchami_compute_image_vars_path: "/opt/omnia/openchami/compute_images_template.yaml" network_spec_syntax_fail_msg: "Failed to load network_spec.yml due to syntax error" ================================================ FILE: build_stream/.gitignore ================================================ .venv .vscode /.idea/ /docs/build/ **/__pycache__/ ================================================ FILE: build_stream/README.md ================================================ # Build Stream **Build Stream** is a **RESTful API** (Representational State Transfer Application Programming Interface) service that orchestrates the creation and management of build jobs for the Omnia infrastructure platform. It provides a centralized interface for managing software catalog parsing, local repository creation, image building, and validation workflows. 
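As a quick, illustrative example (the `/auth/token` path is taken from this service's auth routes; the host, port, any path prefix, and the credential values below are deployment-specific placeholders), a client registered through `/auth/register` exchanges its credentials for a JWT access token and then presents that token on protected endpoints:

```bash
# Exchange client credentials for a JWT access token
# (OAuth2 client_credentials grant, form-encoded).
curl -X POST "http://<build-stream-host>:<port>/auth/token" \
  -H "Content-Type: application/x-www-form-urlencoded" \
  -d "grant_type=client_credentials" \
  -d "client_id=bld_<your_client_id>" \
  -d "client_secret=bld_s_<your_client_secret>" \
  -d "scope=catalog:read"

# Example response:
# {"access_token": "<jwt>", "token_type": "Bearer", "expires_in": 3600, "scope": "catalog:read"}

# Use the token as a Bearer credential on subsequent requests:
curl -H "Authorization: Bearer <access_token>" \
  "http://<build-stream-host>:<port>/<protected-endpoint>"
```

Tokens expire after `expires_in` seconds (3600 by default), after which the client simply requests a new one.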
## Architecture Overview Build Stream follows a clean architecture pattern with clear separation of concerns: - **API Layer** (`api/`): FastAPI routes and HTTP handling - **Core Layer** (`core/`): Business logic, entities, and domain services - **Orchestrator Layer** (`orchestrator/`): Use cases that coordinate workflows - **Infrastructure Layer** (`infra/`): External integrations and data persistence - **Common Layer** (`common/`): Shared utilities and configuration ## High-Level Workflow 1. **Authentication**: **JWT** (JSON Web Token)-based authentication secures all API endpoints 2. **Job Creation**: Clients submit build requests through the jobs API 3. **Stage Processing**: Jobs are broken into stages (catalog parsing, local repo, build image, validation) 4. **Async Execution**: Stages execute asynchronously with result polling 5. **Artifact Management**: Build artifacts are stored and tracked throughout the process 6. **Audit Trail**: All operations are logged for traceability and compliance ## Configuration Configuration is managed through: - Environment variables for runtime settings - `build_stream.ini` for artifact store configuration - Vault integration for secure credential management - Database configuration for persistent storage Key configuration areas: - Database connections (PostgreSQL) - Artifact storage backend (file system or in-memory) - Vault endpoints and authentication - **CORS** (Cross-Origin Resource Sharing) and server settings ## Getting Started ### For Developers **Primary Entry Points:** - `main.py` - FastAPI application entry point - `api/router.py` - API route aggregation - `container.py` - Dependency injection setup **Key Workflows:** - [Jobs Management](./doc/jobs.md) - Job lifecycle and orchestration - [Catalog Processing](./doc/catalog.md) - Software catalog parsing and role generation - [Local Repository](./doc/local_repo.md) - Local package repository creation - [Image Building](./doc/build_image.md) - Container image build workflows - [Validation](./doc/validation.md) - Input and output validation **Development Setup:** ```bash # Install dependencies pip install -r requirements.txt pip install -r requirements-dev.txt # Set environment variables export HOST= export PORT= # Run development server uvicorn main:app --reload # Run tests pytest ``` **API Documentation:** - See Omnia ReadTheDocs for complete API documentation ### Architecture Components **Core Services:** - **Job Service**: Manages job lifecycle and state transitions - **Catalog Service**: Parses software catalogs and generates roles - **Local Repo Service**: Creates and manages local repositories - **Build Service**: Orchestrates container image builds - **Validation Service**: Validates inputs and outputs **Data Flow:** 1. Client requests → API routes → Use cases → Core services → Repositories 2. Async job processing with stage-based execution 3. Result polling and webhook notifications 4. 
Artifact storage and metadata tracking **Security:** - JWT token-based authentication - Vault integration for secret management - Role-based access control - Audit logging for compliance ## Workflow Areas Each major workflow area has dedicated documentation: - **Jobs** - Job creation, monitoring, and lifecycle management - **Catalog** - Software catalog parsing and role generation - **Local Repo** - Local package repository setup and management - **Build Image** - Container image build orchestration - **Validation** - Input validation and output verification See the `doc/` directory for detailed workflow documentation. ## Dependencies Build Stream uses FastAPI with the following key dependencies: - FastAPI/Uvicorn for web framework - SQLAlchemy for database **ORM** (Object-Relational Mapping) - Dependency Injector for **IoC** (Inversion of Control) container - PyJWT for **JWT** (JSON Web Token) authentication - Ansible for infrastructure automation - Vault client for secret management ## Support For troubleshooting and development guidance: 1. Check the workflow-specific documentation in `doc/` 2. Review API logs for error details 3. Consult the audit trail for job execution history 4. Refer to the health check endpoint: `/health` ================================================ FILE: build_stream/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. ================================================ FILE: build_stream/api/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. ================================================ FILE: build_stream/api/auth/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
"""OAuth2 Authentication API module.""" from api.auth.routes import router __all__ = ["router"] ================================================ FILE: build_stream/api/auth/jwt_handler.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """JWT token generation and validation utilities. This module provides JWT handling following the OAuth2 Implementation Spec: - Algorithm: RS256 (RSA signature with SHA-256) - Token Lifetime: 3600 seconds (1 hour) - Claims: iss, sub, aud, iat, exp, nbf, jti, scope, client_name """ import logging import os import uuid from dataclasses import dataclass from datetime import datetime, timedelta, timezone from typing import List, Optional import jwt from jwt.exceptions import ( DecodeError, ExpiredSignatureError, InvalidAudienceError, InvalidIssuerError, InvalidSignatureError, ) logger = logging.getLogger(__name__) class JWTHandlerError(Exception): """Base exception for JWT operations.""" class JWTCreationError(JWTHandlerError): """Exception raised when JWT creation fails.""" class JWTValidationError(JWTHandlerError): """Exception raised when JWT validation fails.""" class JWTExpiredError(JWTValidationError): """Exception raised when JWT has expired.""" class JWTInvalidSignatureError(JWTValidationError): """Exception raised when JWT signature is invalid.""" @dataclass class JWTConfig: """Configuration for JWT token handling.""" private_key_path: str public_key_path: str algorithm: str = "RS256" access_token_expire_minutes: int = 60 issuer: str = "build-stream-api" audience: str = "build-stream-api" key_id: str = "build-stream-key-2026-01" @classmethod def from_env(cls) -> "JWTConfig": """Create JWTConfig from environment variables.""" return cls( private_key_path=os.getenv( "JWT_PRIVATE_KEY_PATH", "/etc/omnia/keys/jwt_private.pem" ), public_key_path=os.getenv( "JWT_PUBLIC_KEY_PATH", "/etc/omnia/keys/jwt_public.pem" ), algorithm=os.getenv("JWT_ALGORITHM", "RS256"), access_token_expire_minutes=int( os.getenv("JWT_ACCESS_TOKEN_EXPIRE_MINUTES", "60") ), issuer=os.getenv("JWT_ISSUER", "build-stream-api"), audience=os.getenv("JWT_AUDIENCE", "build-stream-api"), key_id=os.getenv("JWT_KEY_ID", "build-stream-key-2026-01"), ) @dataclass class TokenData: """Data class representing decoded JWT token claims.""" client_id: str client_name: str scopes: List[str] issued_at: datetime expires_at: datetime token_id: str class JWTHandler: """Handler for JWT token creation and validation.""" def __init__(self, config: Optional[JWTConfig] = None): """Initialize the JWT handler. Args: config: Optional JWTConfig instance. Creates from env if not provided. """ self.config = config or JWTConfig.from_env() self._private_key: Optional[str] = None self._public_key: Optional[str] = None def _load_private_key(self) -> str: """Load the RSA private key for signing tokens. Returns: Private key as string. Raises: JWTCreationError: If key file cannot be read. 
""" if self._private_key is None: try: with open(self.config.private_key_path, "r", encoding="utf-8") as f: self._private_key = f.read() except FileNotFoundError: logger.error("JWT private key not found: %s", self.config.private_key_path) raise JWTCreationError( f"JWT private key not found: {self.config.private_key_path}" ) from None except IOError: logger.error("Failed to read JWT private key") raise JWTCreationError("Failed to read JWT private key") from None return self._private_key def _load_public_key(self) -> str: """Load the RSA public key for verifying tokens. Returns: Public key as string. Raises: JWTValidationError: If key file cannot be read. """ if self._public_key is None: try: with open(self.config.public_key_path, "r", encoding="utf-8") as f: self._public_key = f.read() except FileNotFoundError: logger.error("JWT public key not found: %s", self.config.public_key_path) raise JWTValidationError( f"JWT public key not found: {self.config.public_key_path}" ) from None except IOError: logger.error("Failed to read JWT public key") raise JWTValidationError("Failed to read JWT public key") from None return self._public_key def create_access_token( self, client_id: str, client_name: str, scopes: List[str], ) -> tuple[str, int]: """Create a JWT access token. Args: client_id: The client identifier (becomes 'sub' claim). client_name: Human-readable client name. scopes: List of granted scopes. Returns: Tuple of (access_token, expires_in_seconds). Raises: JWTCreationError: If token creation fails. """ now = datetime.now(timezone.utc) expires_delta = timedelta(minutes=self.config.access_token_expire_minutes) expires_at = now + expires_delta token_id = str(uuid.uuid4()) claims = { "iss": self.config.issuer, "sub": client_id, "aud": self.config.audience, "iat": int(now.timestamp()), "exp": int(expires_at.timestamp()), "nbf": int(now.timestamp()), "jti": token_id, "scope": " ".join(scopes), "client_name": client_name, } headers = { "alg": self.config.algorithm, "typ": "JWT", "kid": self.config.key_id, } try: private_key = self._load_private_key() token = jwt.encode( claims, private_key, algorithm=self.config.algorithm, headers=headers, ) logger.info("Access token created for client: %s", client_id[:8] + "...") return token, int(expires_delta.total_seconds()) except Exception: logger.error("Failed to create access token") raise JWTCreationError("Failed to create access token") from None def validate_token(self, token: str) -> TokenData: """Validate a JWT access token and extract claims. Args: token: The JWT token string. Returns: TokenData with decoded claims. Raises: JWTExpiredError: If token has expired. JWTInvalidSignatureError: If signature is invalid. JWTValidationError: If token is otherwise invalid. 
""" try: public_key = self._load_public_key() payload = jwt.decode( token, public_key, algorithms=[self.config.algorithm], audience=self.config.audience, issuer=self.config.issuer, ) return TokenData( client_id=payload["sub"], client_name=payload.get("client_name", ""), scopes=payload.get("scope", "").split(), issued_at=datetime.fromtimestamp(payload["iat"], tz=timezone.utc), expires_at=datetime.fromtimestamp(payload["exp"], tz=timezone.utc), token_id=payload.get("jti", ""), ) except ExpiredSignatureError: logger.warning("Token has expired") raise JWTExpiredError("Token has expired") from None except (InvalidAudienceError, InvalidIssuerError): logger.warning("Invalid token claims") raise JWTValidationError("Invalid token claims") from None except InvalidSignatureError: logger.warning("Invalid token signature") raise JWTInvalidSignatureError("Invalid token signature") from None except DecodeError: logger.warning("Invalid token format") raise JWTValidationError("Invalid token format") from None except Exception: logger.error("Unexpected error validating token") raise JWTValidationError("Token validation failed") from None ================================================ FILE: build_stream/api/auth/password_handler.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Password hashing utilities using Argon2id algorithm. This module provides secure password hashing following the OAuth2 Implementation Spec: - Algorithm: Argon2id - Memory Cost: 65536 KB (64 MB) - Time Cost: 3 iterations - Parallelism: 4 threads - Salt Length: 16 bytes - Hash Length: 32 bytes """ import logging import secrets from typing import Tuple from argon2 import PasswordHasher, Type from argon2.exceptions import InvalidHashError, VerifyMismatchError logger = logging.getLogger(__name__) _hasher = PasswordHasher( time_cost=3, memory_cost=65536, parallelism=4, hash_len=32, salt_len=16, type=Type.ID, ) def hash_password(password: str) -> str: """Hash a password using Argon2id. Args: password: The plaintext password to hash. Returns: The hashed password in Argon2 PHC string format. """ return _hasher.hash(password) def verify_password(password: str, hashed: str) -> bool: """Verify a password against its hash. Args: password: The plaintext password to verify. hashed: The Argon2 hash to verify against. Returns: True if password matches, False otherwise. """ try: _hasher.verify(hashed, password) return True except (VerifyMismatchError, InvalidHashError): return False def check_needs_rehash(hashed: str) -> bool: """Check if a hash needs to be rehashed due to parameter changes. Args: hashed: The existing hash to check. Returns: True if rehashing is recommended, False otherwise. """ try: return _hasher.check_needs_rehash(hashed) except InvalidHashError: return True def generate_client_id() -> str: """Generate a unique client ID. Returns: A client ID with 'bld_' prefix followed by 32 hex characters. 
""" return f"bld_{secrets.token_hex(16)}" def generate_client_secret() -> str: """Generate a cryptographically secure client secret. Returns: A client secret with 'bld_s_' prefix followed by URL-safe base64 characters. """ return f"bld_s_{secrets.token_urlsafe(32)}" def generate_credentials() -> Tuple[str, str, str]: """Generate a new client ID, secret, and hashed secret. Returns: Tuple of (client_id, client_secret, hashed_secret). The client_secret is the plaintext to return to the client. The hashed_secret is what should be stored in the vault. """ client_id = generate_client_id() client_secret = generate_client_secret() hashed_secret = hash_password(client_secret) return client_id, client_secret, hashed_secret ================================================ FILE: build_stream/api/auth/routes.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """FastAPI routes for OAuth2 authentication endpoints.""" from typing import Annotated from fastapi import APIRouter, Depends, HTTPException, status from fastapi.security import HTTPBasic, HTTPBasicCredentials from api.logging_utils import log_auth_info from api.vault_client import VaultError from api.auth.schemas import ( AuthErrorResponse, ClientRegistrationRequest, ClientRegistrationResponse, TokenRequest, TokenResponse, ) from api.auth.service import ( AuthService, AuthenticationError, ClientDisabledError, ClientExistsError, InvalidClientError, InvalidScopeError, MaxClientsReachedError, RegistrationDisabledError, TokenCreationError, ) router = APIRouter(prefix="/auth", tags=["Authentication"]) security = HTTPBasic() def get_auth_service() -> AuthService: """Provide AuthService instance for dependency injection.""" return AuthService() def _verify_basic_auth( credentials: Annotated[HTTPBasicCredentials, Depends(security)], auth_service: Annotated[AuthService, Depends(get_auth_service)], ) -> HTTPBasicCredentials: """Verify Basic Authentication credentials for registration. Args: credentials: HTTP Basic Auth credentials from request. auth_service: AuthService instance. Returns: Validated credentials. Raises: HTTPException: If authentication fails. 
""" try: auth_service.verify_registration_credentials( credentials.username, credentials.password, ) log_auth_info("info", "Register auth: credentials verified") return credentials except AuthenticationError: log_auth_info("error", "Register auth: invalid credentials, status=401", end_section=True) raise HTTPException( status_code=status.HTTP_401_UNAUTHORIZED, detail={ "error": "invalid_credentials", "error_description": "Invalid Basic Auth credentials", }, headers={"WWW-Authenticate": "Basic"}, ) from None except RegistrationDisabledError: log_auth_info("warning", "Register auth: registration disabled, status=503", end_section=True) raise HTTPException( status_code=status.HTTP_503_SERVICE_UNAVAILABLE, detail={ "error": "service_unavailable", "error_description": "Registration service is not available", }, ) from None except Exception: log_auth_info("error", "Register auth: unexpected error during credential verification", exc_info=True, end_section=True) raise HTTPException( status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail={ "error": "server_error", "error_description": "An unexpected error occurred", }, ) from None @router.post( "/register", response_model=ClientRegistrationResponse, status_code=status.HTTP_201_CREATED, summary="Register a new OAuth client", description="Register a new OAuth client using HTTP Basic Authentication. " "Returns client_id and client_secret which must be securely stored.", responses={ 201: { "description": "Client registered successfully", "model": ClientRegistrationResponse, }, 400: { "description": "Invalid request (missing or malformed request body)", "model": AuthErrorResponse, }, 401: { "description": "Invalid Basic Auth credentials", "model": AuthErrorResponse, }, 409: { "description": "Client name already registered", "model": AuthErrorResponse, }, 422: { "description": "Validation error (invalid field values)", "model": AuthErrorResponse, }, 429: { "description": "Rate limit exceeded", "model": AuthErrorResponse, }, 500: { "description": "Internal server error", "model": AuthErrorResponse, }, 503: { "description": "Registration service unavailable", "model": AuthErrorResponse, }, }, ) async def register_client( request: ClientRegistrationRequest, credentials: Annotated[HTTPBasicCredentials, Depends(_verify_basic_auth)], # pylint: disable=unused-argument auth_service: Annotated[AuthService, Depends(get_auth_service)], ) -> ClientRegistrationResponse: """Register a new OAuth client. This endpoint requires HTTP Basic Authentication with pre-configured registration credentials. On success, returns client_id and client_secret which the client must securely store. **Important:** The client_secret is shown only once during registration. Args: request: Client registration request containing client_name and optional fields. credentials: Validated Basic Auth credentials (injected by dependency). auth_service: AuthService instance (injected by dependency). Returns: ClientRegistrationResponse with client_id and client_secret. Raises: HTTPException: With appropriate status code on failure. 
""" log_auth_info( "info", f"Register request: client_name={request.client_name}", ) try: registered_client = auth_service.register_client( client_name=request.client_name, description=request.description, allowed_scopes=request.allowed_scopes, ) log_auth_info( "info", f"Register success: client_name={request.client_name}, " f"client_id={registered_client.client_id}, " f"scopes={registered_client.allowed_scopes}, status=201", end_section=True, ) return ClientRegistrationResponse( client_id=registered_client.client_id, client_secret=registered_client.client_secret, client_name=registered_client.client_name, allowed_scopes=registered_client.allowed_scopes, created_at=registered_client.created_at, expires_at=registered_client.expires_at, ) except MaxClientsReachedError as e: log_auth_info("warning", f"Register failed: client_name={request.client_name}, reason=max_clients_reached, status=409", end_section=True) raise HTTPException( status_code=status.HTTP_409_CONFLICT, detail={ "error": "max_clients_reached", "error_description": "Maximum number of clients (1) already registered" }, ) from None except ClientExistsError: log_auth_info("warning", f"Register failed: client_name={request.client_name}, reason=client_exists, status=409", end_section=True) raise HTTPException( status_code=status.HTTP_409_CONFLICT, detail={ "error": "client_exists", "error_description": "Client with this name already exists", }, ) from None except VaultError: log_auth_info("error", f"Register failed: client_name={request.client_name}, reason=vault_error, status=500", end_section=True) raise HTTPException( status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail={ "error": "server_error", "error_description": "Failed to store client credentials", }, ) from None except Exception as e: log_auth_info( "error", f"Register failed: client_name={request.client_name}, reason=unexpected_error, status=500", exc_info=True, end_section=True, ) raise HTTPException( status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail={ "error": "server_error", "error_description": "An unexpected error occurred", }, ) from None @router.post( "/token", response_model=TokenResponse, status_code=status.HTTP_200_OK, summary="Request an access token", description="Exchange client credentials for a JWT access token using " "OAuth2 client_credentials grant type.", responses={ 200: { "description": "Token generated successfully", "model": TokenResponse, }, 400: { "description": "Invalid request (unsupported grant type, invalid scope)", "model": AuthErrorResponse, }, 401: { "description": "Invalid client credentials", "model": AuthErrorResponse, }, 403: { "description": "Client account is disabled", "model": AuthErrorResponse, }, 500: { "description": "Internal server error", "model": AuthErrorResponse, }, }, ) async def request_token( request: Annotated[TokenRequest, Depends()], auth_service: Annotated[AuthService, Depends(get_auth_service)], ) -> TokenResponse: """Request an OAuth2 access token. This endpoint implements the OAuth2 client_credentials grant type. Clients must provide their client_id and client_secret to receive a JWT access token. Args: request: Token request containing grant_type, client_id, client_secret, and optional scope. auth_service: AuthService instance (injected by dependency). Returns: TokenResponse with access_token, token_type, expires_in, and scope. Raises: HTTPException: With appropriate status code on failure. 
""" client_id_short = request.client_id if request.client_id else "None" log_auth_info( "info", f"Token request: client_id={client_id_short}, " f"grant_type={request.grant_type}, scope={request.scope}", ) if request.client_id is None or request.client_secret is None: log_auth_info("warning", f"Token failed: client_id={client_id_short}, reason=missing_credentials, status=400", end_section=True) raise HTTPException( status_code=status.HTTP_400_BAD_REQUEST, detail={ "error": "invalid_request", "error_description": "client_id and client_secret are required", }, ) try: token_result = auth_service.generate_token( client_id=request.client_id, client_secret=request.client_secret, requested_scope=request.scope, ) log_auth_info( "info", f"Token success: client_id={client_id_short}, " f"scope={token_result.scope}, " f"expires_in={token_result.expires_in}s, status=200", end_section=True, ) return TokenResponse( access_token=token_result.access_token, token_type=token_result.token_type, expires_in=token_result.expires_in, scope=token_result.scope, ) except InvalidClientError: log_auth_info("warning", f"Token failed: client_id={client_id_short}, reason=invalid_client, status=401", end_section=True) raise HTTPException( status_code=status.HTTP_401_UNAUTHORIZED, detail={ "error": "invalid_client", "error_description": "Client authentication failed", }, ) from None except ClientDisabledError: log_auth_info("warning", f"Token failed: client_id={client_id_short}, reason=client_disabled, status=403", end_section=True) raise HTTPException( status_code=status.HTTP_403_FORBIDDEN, detail={ "error": "client_disabled", "error_description": "Client account is disabled", }, ) from None except InvalidScopeError as e: log_auth_info("warning", f"Token failed: client_id={client_id_short}, reason=invalid_scope, detail={e}, status=400", end_section=True) raise HTTPException( status_code=status.HTTP_400_BAD_REQUEST, detail={ "error": "invalid_scope", "error_description": str(e), }, ) from None except TokenCreationError: log_auth_info("error", f"Token failed: client_id={client_id_short}, reason=token_creation_error, status=500", end_section=True) raise HTTPException( status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail={ "error": "server_error", "error_description": "Failed to create access token", }, ) from None except Exception: log_auth_info("error", f"Token failed: client_id={client_id_short}, reason=unexpected_error, status=500", exc_info=True, end_section=True) raise HTTPException( status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail={ "error": "server_error", "error_description": "An unexpected error occurred", }, ) from None ================================================ FILE: build_stream/api/auth/schemas.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
"""Pydantic schemas for OAuth2 authentication API request and response models.""" import re from datetime import datetime from enum import Enum from typing import List, Optional from fastapi import Form, HTTPException, status from pydantic import BaseModel, Field, field_validator class ClientRegistrationRequest(BaseModel): # pylint: disable=too-few-public-methods """Request model for client registration.""" client_name: str = Field( ..., min_length=1, max_length=64, description="Unique identifier for the client (alphanumeric, hyphens, max 64 chars)", ) description: Optional[str] = Field( default=None, max_length=256, description="Human-readable description (max 256 chars)", ) allowed_scopes: Optional[List[str]] = Field( default=None, description="Requested OAuth scopes (default: ['catalog:read'])", ) @field_validator("client_name") @classmethod def validate_client_name(cls, v: str) -> str: """Validate client_name contains only allowed characters.""" if not re.match(r"^[a-zA-Z0-9][a-zA-Z0-9_-]*$", v): raise ValueError( "client_name must start with alphanumeric and contain only " "alphanumeric characters, hyphens, and underscores" ) return v @field_validator("allowed_scopes") @classmethod def validate_scopes(cls, v: Optional[List[str]]) -> Optional[List[str]]: """Validate that requested scopes are valid.""" valid_scopes = {"catalog:read", "catalog:write", "admin:read", "admin:write", "job:read", "job:write"} if v is not None: for scope in v: if scope not in valid_scopes: raise ValueError(f"Invalid scope: {scope}") return v class ClientRegistrationResponse(BaseModel): # pylint: disable=too-few-public-methods """Response model for successful client registration.""" client_id: str = Field( ..., description="Unique client identifier (prefix: bld_)", ) client_secret: str = Field( ..., description="Client secret (prefix: bld_s_) - shown only once", ) client_name: str = Field( ..., description="The registered client name", ) allowed_scopes: List[str] = Field( ..., description="Granted OAuth scopes", ) created_at: datetime = Field( ..., description="Registration timestamp", ) expires_at: Optional[datetime] = Field( default=None, description="Credential expiration (null = no expiry)", ) model_config = { "json_schema_extra": { "examples": [ { "client_id": "bld_<32_hex_characters>", #"client_secret": "", #Commented out for security "client_name": "example-client-name", "allowed_scopes": ["catalog:read", "catalog:write"], "created_at": "2026-01-21T07:31:00Z", "expires_at": None, } ] } } class AuthErrorResponse(BaseModel): # pylint: disable=too-few-public-methods """OAuth2 error response model following RFC 6749.""" error: str = Field( ..., description="Error code (machine-readable)", ) error_description: str = Field( ..., description="Human-readable error description", ) model_config = { "json_schema_extra": { "examples": [ { "error": "invalid_credentials", "error_description": "Invalid Basic Auth credentials", }, { "error": "client_exists", "error_description": "Client name already registered", }, ] } } class GrantType(str, Enum): """Supported OAuth2 grant types.""" CLIENT_CREDENTIALS = "client_credentials" class TokenRequest: # pylint: disable=too-few-public-methods """Request model for OAuth2 token endpoint (application/x-www-form-urlencoded).""" def __init__( self, grant_type: GrantType = Form(..., description="OAuth2 grant type"), client_id: Optional[str] = Form(default=None, description="Client identifier"), client_secret: Optional[str] = Form(default=None, description="Client secret"), scope: 
Optional[str] = Form(default=None, description="Requested scopes"), ): """Initialize token request from form data.""" self.grant_type = grant_type self.client_id = self._validate_client_id(client_id) self.client_secret = self._validate_client_secret(client_secret) self.scope = scope @staticmethod def _validate_client_id(v: Optional[str]) -> Optional[str]: """Validate client_id format if provided.""" if v is not None and not v.startswith("bld_"): raise HTTPException( status_code=status.HTTP_422_UNPROCESSABLE_CONTENT, detail=[{ "type": "value_error", "loc": ["body", "client_id"], "msg": "client_id must start with 'bld_' prefix", }], ) return v @staticmethod def _validate_client_secret(v: Optional[str]) -> Optional[str]: """Validate client_secret format if provided.""" if v is not None and not v.startswith("bld_s_"): raise HTTPException( status_code=status.HTTP_422_UNPROCESSABLE_CONTENT, detail=[{ "type": "value_error", "loc": ["body", "client_secret"], "msg": "client_secret must start with 'bld_s_' prefix", }], ) return v class TokenResponse(BaseModel): # pylint: disable=too-few-public-methods """Response model for successful token generation (RFC 6749 compliant).""" access_token: str = Field( ..., description="JWT access token", ) token_type: str = Field( default="Bearer", description="Token type (always 'Bearer')", ) expires_in: int = Field( ..., description="Token lifetime in seconds", ) scope: str = Field( ..., description="Granted scopes (space-separated)", ) model_config = { "json_schema_extra": { "examples": [ { "access_token": "eyJhbGciOiJSUzI1NiIsInR5cCI6IkpXVCJ9...", "token_type": "Bearer", "expires_in": 3600, "scope": "catalog:read catalog:write", } ] } } ================================================ FILE: build_stream/api/auth/service.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
"""Authentication service for OAuth2 client management.""" import os from dataclasses import dataclass from datetime import datetime, timezone from typing import List, Optional from api.auth.jwt_handler import JWTHandler, JWTCreationError from api.auth.password_handler import generate_credentials, verify_password from api.logging_utils import log_auth_info from api.vault_client import VaultClient, VaultDecryptError, VaultNotFoundError from core.exceptions import ( ClientDisabledError, InvalidClientError, InvalidScopeError, TokenCreationError, ) DEFAULT_SCOPES = ["catalog:read"] class AuthenticationError(Exception): """Exception raised when authentication fails.""" class ClientExistsError(Exception): """Exception raised when client name already exists.""" class MaxClientsReachedError(Exception): """Exception raised when maximum number of clients is already registered.""" class RegistrationDisabledError(Exception): """Exception raised when registration is disabled or misconfigured.""" @dataclass class RegisteredClient: """Data class representing a registered OAuth client.""" client_id: str client_secret: str client_name: str allowed_scopes: List[str] created_at: datetime expires_at: Optional[datetime] = None @dataclass class TokenResult: """Data class representing a token generation result.""" access_token: str token_type: str expires_in: int scope: str class AuthService: """Service for handling OAuth2 authentication operations.""" def __init__( self, vault_client: Optional[VaultClient] = None, jwt_handler: Optional[JWTHandler] = None, ): """Initialize the authentication service. Args: vault_client: Optional VaultClient instance. Creates default if not provided. jwt_handler: Optional JWTHandler instance. Creates default if not provided. """ self.vault_client = vault_client or VaultClient() self.jwt_handler = jwt_handler or JWTHandler() self._registration_username = os.getenv("AUTH_REGISTRATION_USERNAME") def verify_registration_credentials(self, username: str, password: str) -> bool: """Verify the Basic Auth credentials for registration endpoint. Args: username: The provided username. password: The provided password. Returns: True if credentials are valid. Raises: AuthenticationError: If credentials are invalid. RegistrationDisabledError: If registration is not configured. """ try: auth_config = self.vault_client.get_auth_config() except VaultNotFoundError: raise RegistrationDisabledError( "Registration is not configured" ) from None except VaultDecryptError: raise RegistrationDisabledError( "Registration configuration error" ) from None registration_config = auth_config.get("auth_registration", {}) stored_username = registration_config.get("username") stored_password_hash = registration_config.get("password_hash") if not stored_username or not stored_password_hash: raise RegistrationDisabledError( "Registration is not configured" ) from None if username != stored_username: raise AuthenticationError("Invalid credentials") if not verify_password(password, stored_password_hash): raise AuthenticationError("Invalid credentials") return True def register_client( self, client_name: str, description: Optional[str] = None, allowed_scopes: Optional[List[str]] = None, ) -> RegisteredClient: """Register a new OAuth client. Args: client_name: Unique name for the client. description: Optional description of the client. allowed_scopes: List of OAuth scopes to grant. Returns: RegisteredClient with credentials (secret shown only once). Raises: ClientExistsError: If client_name is already registered. 
MaxClientsReachedError: If maximum client limit (1) is reached. VaultError: If vault operations fail. """ active_count = self.vault_client.get_active_client_count() if active_count >= 1: raise MaxClientsReachedError( "Maximum number of clients (1) already registered. " "Only one active client is supported." ) if self.vault_client.client_exists(client_name): raise ClientExistsError("Client already exists") scopes = allowed_scopes if allowed_scopes else DEFAULT_SCOPES client_id, client_secret, hashed_secret = generate_credentials() created_at = datetime.now(timezone.utc) client_data = { "client_name": client_name, "client_secret_hash": hashed_secret, "description": description, "allowed_scopes": scopes, "created_at": created_at.isoformat(), "is_active": True, } self.vault_client.save_oauth_client(client_id, client_data) return RegisteredClient( client_id=client_id, client_secret=client_secret, client_name=client_name, allowed_scopes=scopes, created_at=created_at, expires_at=None, ) def verify_client_credentials( self, client_id: str, client_secret: str, ) -> dict: """Verify client credentials for token endpoint. Args: client_id: The client identifier. client_secret: The client secret. Returns: Client data dictionary if credentials are valid. Raises: InvalidClientError: If client_id is unknown or secret is invalid. ClientDisabledError: If client account is disabled. """ try: oauth_clients = self.vault_client.get_oauth_clients() except (VaultNotFoundError, VaultDecryptError): log_auth_info("error", "Failed to load OAuth clients from vault") # Ensure no exception details are exposed raise InvalidClientError("Client authentication failed") from None if client_id not in oauth_clients: log_auth_info("warning", f"Unknown client_id attempted authentication: {client_id}") raise InvalidClientError("Client authentication failed") client_data = oauth_clients[client_id] if not client_data.get("is_active", False): log_auth_info("warning", f"Disabled client attempted token request: {client_id}") raise ClientDisabledError("Client account is disabled") stored_hash = client_data.get("client_secret_hash") if not stored_hash or not verify_password(client_secret, stored_hash): log_auth_info("warning", f"Invalid client secret provided: {client_id}") raise InvalidClientError("Client authentication failed") log_auth_info("info", f"Client credentials verified successfully: {client_id}") return client_data def generate_token( self, client_id: str, client_secret: str, requested_scope: Optional[str] = None, ) -> TokenResult: """Generate a JWT access token for authenticated client. Args: client_id: The client identifier. client_secret: The client secret. requested_scope: Optional space-separated list of requested scopes. Returns: TokenResult with access token and metadata. Raises: InvalidClientError: If client credentials are invalid. ClientDisabledError: If client account is disabled. InvalidScopeError: If requested scope is not allowed. TokenCreationError: If token creation fails. 
""" client_data = self.verify_client_credentials(client_id, client_secret) allowed_scopes = client_data.get("allowed_scopes", DEFAULT_SCOPES) client_name = client_data.get("client_name", "") if requested_scope: requested_scopes = requested_scope.split() for scope in requested_scopes: if scope not in allowed_scopes: log_auth_info( "warning", f"Client requested unauthorized scope: {scope}, client_id={client_id}", ) raise InvalidScopeError(f"Scope '{scope}' is not allowed for this client") granted_scopes = requested_scopes else: granted_scopes = allowed_scopes try: access_token, expires_in = self.jwt_handler.create_access_token( client_id=client_id, client_name=client_name, scopes=granted_scopes, ) except JWTCreationError: log_auth_info("error", f"Failed to create access token: {client_id}") raise TokenCreationError("Failed to create access token") from None log_auth_info("info", f"Access token generated successfully: {client_id}") return TokenResult( access_token=access_token, token_type="Bearer", expires_in=expires_in, scope=" ".join(granted_scopes), ) ================================================ FILE: build_stream/api/build_image/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Build Image API module.""" from api.build_image.routes import router __all__ = ["router"] ================================================ FILE: build_stream/api/build_image/dependencies.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
"""FastAPI dependency providers for Build Image API.""" from typing import Optional from fastapi import Depends, Header, HTTPException, status from sqlalchemy.orm import Session from api.dependencies import ( get_db_session, _create_sql_job_repo, _create_sql_stage_repo, _create_sql_audit_repo, _get_container, _ENV, ) from core.jobs.value_objects import ClientId, CorrelationId from orchestrator.build_image.use_cases import CreateBuildImageUseCase def _get_container(): """Lazy import of container to avoid circular imports.""" from container import container # pylint: disable=import-outside-toplevel return container def get_create_build_image_use_case( db_session: Session = Depends(get_db_session), ) -> CreateBuildImageUseCase: """Provide create build image use case with shared session in prod.""" if _ENV == "prod": container = _get_container() return CreateBuildImageUseCase( job_repo=_create_sql_job_repo(db_session), stage_repo=_create_sql_stage_repo(db_session), audit_repo=_create_sql_audit_repo(db_session), config_service=container.build_image_config_service(), queue_service=container.playbook_queue_request_service(), inventory_repo=container.input_repository(), uuid_generator=container.uuid_generator(), ) return _get_container().create_build_image_use_case() def get_build_image_correlation_id( x_correlation_id: Optional[str] = Header( default=None, alias="X-Correlation-Id", description="Request tracing ID", ), ) -> CorrelationId: """Return provided correlation ID or generate one.""" generator = _get_container().uuid_generator() if x_correlation_id: try: return CorrelationId(x_correlation_id) except ValueError: pass generated_id = generator.generate() return CorrelationId(str(generated_id)) ================================================ FILE: build_stream/api/build_image/routes.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
"""FastAPI routes for build image stage operations.""" from datetime import datetime, timezone from typing import Annotated from fastapi import APIRouter, Depends, HTTPException, status from api.build_image.dependencies import ( get_create_build_image_use_case, get_build_image_correlation_id, ) from api.dependencies import verify_token, require_job_write from api.build_image.schemas import ( CreateBuildImageRequest, CreateBuildImageResponse, BuildImageErrorResponse, ) from api.logging_utils import log_secure_info from core.build_image.exceptions import ( BuildImageDomainError, InvalidArchitectureError, InvalidImageKeyError, InvalidFunctionalGroupsError, InventoryHostMissingError, ) from core.jobs.exceptions import ( InvalidStateTransitionError, JobNotFoundError, StageNotFoundError, TerminalStateViolationError, UpstreamStageNotCompletedError, ) from core.jobs.value_objects import ClientId, CorrelationId, JobId from orchestrator.build_image.commands import CreateBuildImageCommand from orchestrator.build_image.use_cases import CreateBuildImageUseCase router = APIRouter(prefix="/jobs", tags=["Build Image"]) def _build_error_response( error_code: str, message: str, correlation_id: str, ) -> BuildImageErrorResponse: return BuildImageErrorResponse( error=error_code, message=message, correlation_id=correlation_id, timestamp=datetime.now(timezone.utc).isoformat() + "Z", ) @router.post( "/{job_id}/stages/build-image", response_model=CreateBuildImageResponse, status_code=status.HTTP_202_ACCEPTED, summary="Create build image", description="Trigger the build-image stage for a job", responses={ 202: {"description": "Stage accepted", "model": CreateBuildImageResponse}, 400: {"description": "Invalid request", "model": BuildImageErrorResponse}, 401: {"description": "Unauthorized", "model": BuildImageErrorResponse}, 404: {"description": "Job not found", "model": BuildImageErrorResponse}, 409: {"description": "Stage conflict", "model": BuildImageErrorResponse}, 500: {"description": "Internal error", "model": BuildImageErrorResponse}, }, ) def create_build_image( job_id: str, request_body: CreateBuildImageRequest, token_data: Annotated[dict, Depends(verify_token)] = None, # pylint: disable=unused-argument use_case: CreateBuildImageUseCase = Depends(get_create_build_image_use_case), correlation_id: CorrelationId = Depends(get_build_image_correlation_id), _: None = Depends(require_job_write), ) -> CreateBuildImageResponse: """Trigger the build-image stage for a job. Accepts the request synchronously and returns 202 Accepted. The playbook execution is handled by the NFS queue watcher service. 
""" # Extract client_id from validated token data client_id = ClientId(token_data["client_id"]) log_secure_info( "info", f"Create build image request: job_id={job_id}, arch={request_body.architecture}, " f"image_key={request_body.image_key}, correlation_id={correlation_id.value}", identifier=str(client_id.value), job_id=job_id, ) try: validated_job_id = JobId(job_id) except ValueError as exc: raise HTTPException( status_code=status.HTTP_400_BAD_REQUEST, detail=_build_error_response( "INVALID_JOB_ID", f"Invalid job_id format: {job_id}", correlation_id.value, ).model_dump(), ) from exc try: command = CreateBuildImageCommand( job_id=validated_job_id, client_id=client_id, correlation_id=correlation_id, architecture=request_body.architecture, image_key=request_body.image_key, functional_groups=request_body.functional_groups, ) log_secure_info( "debug", f"Build image executing: job_id={job_id}, arch={request_body.architecture}, " f"image_key={request_body.image_key}, " f"functional_groups={request_body.functional_groups}", job_id=job_id, ) result = use_case.execute(command) log_secure_info( "info", f"Build image success: job_id={job_id}, " f"arch={result.architecture}, image_key={result.image_key}, " f"stage={result.stage_name}, stage_status={result.status}, status=202", job_id=job_id, end_section=True, ) return CreateBuildImageResponse( job_id=result.job_id, stage=result.stage_name, status=result.status, submitted_at=result.submitted_at, correlation_id=result.correlation_id, architecture=result.architecture, image_key=result.image_key, functional_groups=result.functional_groups, ) except JobNotFoundError as exc: log_secure_info("warning", f"Build image failed: job_id={job_id}, reason=job_not_found, status=404", job_id=job_id, end_section=True) raise HTTPException( status_code=status.HTTP_404_NOT_FOUND, detail=_build_error_response( "JOB_NOT_FOUND", exc.message, correlation_id.value, ).model_dump(), ) from exc except StageNotFoundError as exc: log_secure_info("warning", f"Build image failed: job_id={job_id}, reason=stage_not_found, status=404", job_id=job_id, end_section=True) raise HTTPException( status_code=status.HTTP_404_NOT_FOUND, detail=_build_error_response( "STAGE_NOT_FOUND", exc.message, correlation_id.value, ).model_dump(), ) from exc except UpstreamStageNotCompletedError as exc: log_secure_info( "warning", f"Build image failed: job_id={job_id}, reason=upstream_stage_not_completed, status=412", job_id=job_id, end_section=True, ) raise HTTPException( status_code=status.HTTP_412_PRECONDITION_FAILED, detail=_build_error_response( "UPSTREAM_STAGE_NOT_COMPLETED", exc.message, correlation_id.value, ).model_dump(), ) from exc except InvalidStateTransitionError as exc: log_secure_info( "warning", f"Build image failed: job_id={job_id}, reason=invalid_state_transition, status=409", job_id=job_id, end_section=True, ) raise HTTPException( status_code=status.HTTP_409_CONFLICT, detail=_build_error_response( "INVALID_STATE_TRANSITION", exc.message, correlation_id.value, ).model_dump(), ) from exc except TerminalStateViolationError as exc: log_secure_info( "warning", f"Build image failed: job_id={job_id}, reason=terminal_state_violation, status=412", job_id=job_id, end_section=True, ) if exc.state == "FAILED": message = f"Job {job_id} stage is in {exc.state} state and cannot be retried. Reset the stage using /stages/build-image/reset endpoint." else: message = f"Job {job_id} stage is in {exc.state} state and cannot be modified." 
raise HTTPException( status_code=status.HTTP_412_PRECONDITION_FAILED, detail=_build_error_response( "TERMINAL_STATE_VIOLATION", message, correlation_id.value, ).model_dump(), ) from exc except InvalidArchitectureError as exc: log_secure_info( "warning", f"Build image failed: job_id={job_id}, reason=invalid_architecture, " f"arch={request_body.architecture}, status=400", job_id=job_id, end_section=True, ) raise HTTPException( status_code=status.HTTP_400_BAD_REQUEST, detail=_build_error_response( "INVALID_ARCHITECTURE", exc.message, correlation_id.value, ).model_dump(), ) from exc except InvalidImageKeyError as exc: log_secure_info( "warning", f"Build image failed: job_id={job_id}, reason=invalid_image_key, " f"image_key={request_body.image_key}, status=400", job_id=job_id, end_section=True, ) raise HTTPException( status_code=status.HTTP_400_BAD_REQUEST, detail=_build_error_response( "INVALID_IMAGE_KEY", exc.message, correlation_id.value, ).model_dump(), ) from exc except InvalidFunctionalGroupsError as exc: log_secure_info( "warning", f"Build image failed: job_id={job_id}, reason=invalid_functional_groups, status=400", job_id=job_id, end_section=True, ) raise HTTPException( status_code=status.HTTP_400_BAD_REQUEST, detail=_build_error_response( "INVALID_FUNCTIONAL_GROUPS", exc.message, correlation_id.value, ).model_dump(), ) from exc except InventoryHostMissingError as exc: log_secure_info( "warning", f"Build image failed: job_id={job_id}, reason=inventory_host_missing, status=400", job_id=job_id, end_section=True, ) raise HTTPException( status_code=status.HTTP_400_BAD_REQUEST, detail=_build_error_response( "INVENTORY_HOST_MISSING", exc.message, correlation_id.value, ).model_dump(), ) from exc except BuildImageDomainError as exc: log_secure_info( "error", f"Build image failed: job_id={job_id}, reason=domain_error, status=500", job_id=job_id, end_section=True, ) raise HTTPException( status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail=_build_error_response( "BUILD_IMAGE_ERROR", exc.message, correlation_id.value, ).model_dump(), ) from exc except Exception as exc: log_secure_info( "error", f"Build image failed: job_id={job_id}, reason=unexpected_error, status=500", job_id=job_id, exc_info=True, end_section=True, ) raise HTTPException( status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail=_build_error_response( "INTERNAL_ERROR", "An unexpected error occurred", correlation_id.value, ).model_dump(), ) from exc ================================================ FILE: build_stream/api/build_image/schemas.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
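# ---------------------------------------------------------------------------
# Illustrative sketch (not part of the repository): the route above accepts a
# POST to /jobs/{job_id}/stages/build-image and answers 202 once the stage is
# queued for the NFS queue watcher. Assuming a hypothetical base URL, job ID,
# bearer token, and functional-group list, a standard-library client call could
# look like this (the router mount point may differ in a real deployment):

import json
import urllib.request

BASE_URL = "http://localhost:8000"                       # assumption
JOB_ID = "019bf590-1234-7890-abcd-ef1234567890"          # assumption: existing job
TOKEN = "<access-token-with-job-write-scope>"            # from the auth token endpoint

payload = {
    "architecture": "x86_64",
    "image_key": "image-build",
    "functional_groups": ["slurm_node_x86_64"],
}
request = urllib.request.Request(
    f"{BASE_URL}/jobs/{JOB_ID}/stages/build-image",
    data=json.dumps(payload).encode("utf-8"),
    headers={
        "Authorization": f"Bearer {TOKEN}",
        "Content-Type": "application/json",
        "X-Correlation-Id": "9c1d2f34-0000-4000-8000-000000000000",  # optional tracing header
    },
    method="POST",
)
with urllib.request.urlopen(request) as response:
    print(response.status, json.loads(response.read()))  # expect 202 and the acceptance body
# ---------------------------------------------------------------------------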
"""Pydantic schemas for Build Image API requests and responses.""" from typing import List, Optional from pydantic import BaseModel, Field, field_validator class CreateBuildImageRequest(BaseModel): """Request model for build image stage.""" architecture: str = Field( ..., description="Target architecture (x86_64 or aarch64)", pattern="^(x86_64|aarch64)$", ) image_key: str = Field( ..., description="Image identifier key", min_length=1, max_length=128, ) functional_groups: List[str] = Field( ..., description="List of functional groups to build", min_items=1, max_items=50, ) class CreateBuildImageResponse(BaseModel): """Response model for build image stage acceptance (202 Accepted).""" job_id: str = Field(..., description="Job identifier") stage: str = Field(..., description="Stage identifier") status: str = Field(..., description="Acceptance status") submitted_at: str = Field(..., description="Submission timestamp (ISO 8601)") correlation_id: str = Field(..., description="Correlation identifier") architecture: str = Field(..., description="Target architecture") image_key: str = Field(..., description="Image identifier key") functional_groups: List[str] = Field(..., description="List of functional groups to build") class BuildImageErrorResponse(BaseModel): """Standard error response body for build image operations.""" error: str = Field(..., description="Error code") message: str = Field(..., description="Error message") correlation_id: str = Field(..., description="Request correlation ID") timestamp: str = Field(..., description="Error timestamp (ISO 8601)") ================================================ FILE: build_stream/api/catalog_roles/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. ================================================ FILE: build_stream/api/catalog_roles/dependencies.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """FastAPI dependency providers for Catalog Roles API. This module provides catalog-roles-specific dependencies like the catalog roles service provider. 
""" from fastapi import Depends from sqlalchemy.orm import Session from api.dependencies import ( get_db_session, _create_sql_stage_repo, _create_sql_job_repo, _get_container, _ENV, ) from api.catalog_roles.service import CatalogRolesService # ------------------------------------------------------------------ # Catalog-roles-specific dependency providers # ------------------------------------------------------------------ def get_catalog_roles_service( db_session: Session = Depends(get_db_session), ) -> CatalogRolesService: """Provide catalog roles service with shared session in prod.""" if _ENV == "prod": from infra.db.repositories import SqlArtifactMetadataRepository container = _get_container() return CatalogRolesService( artifact_store=container.artifact_store(), artifact_metadata_repo=SqlArtifactMetadataRepository(db_session), stage_repo=_create_sql_stage_repo(db_session), job_repo=_create_sql_job_repo(db_session), ) return _get_container().catalog_roles_service() if hasattr(_get_container(), 'catalog_roles_service') else CatalogRolesService( artifact_store=_get_container().artifact_store(), artifact_metadata_repo=_get_container().artifact_metadata_repository(), stage_repo=_get_container().stage_repository(), job_repo=_get_container().job_repository(), ) ================================================ FILE: build_stream/api/catalog_roles/routes.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """FastAPI routes for catalog roles API.""" from typing import Annotated from fastapi import APIRouter, Depends, HTTPException, status from api.dependencies import require_catalog_read, verify_token from api.catalog_roles.dependencies import get_catalog_roles_service from api.catalog_roles.schemas import ErrorResponse, GetRolesResponse from api.logging_utils import log_secure_info from api.catalog_roles.service import ( CatalogRolesService, RolesNotFoundError, ) from core.jobs.exceptions import JobNotFoundError, UpstreamStageNotCompletedError from core.jobs.value_objects import JobId router = APIRouter(prefix="/jobs", tags=["Catalog Roles"]) @router.get( "/{job_id}/catalog/roles", response_model=GetRolesResponse, status_code=status.HTTP_200_OK, summary="Get catalog metadata including roles, image_key, and architectures", description=( "Returns catalog metadata extracted from parse-catalog artifacts: " "roles (from functional_layer.json), image_key (catalog Identifier), " "and supported architectures. This metadata is used by the build-image API. " "The parse-catalog stage must be in COMPLETED state before calling this endpoint. " "Requires a valid JWT token with 'catalog:read' scope." 
), responses={ 200: { "description": "Roles retrieved successfully", "model": GetRolesResponse, }, 401: { "description": "Unauthorized (missing or invalid token)", "model": ErrorResponse, }, 403: { "description": "Forbidden (insufficient scope)", "model": ErrorResponse, }, 404: { "description": "Job not found", "model": ErrorResponse, }, 422: { "description": "Upstream stage not completed (parse-catalog must be COMPLETED)", "model": ErrorResponse, }, 500: { "description": "Internal server error", "model": ErrorResponse, }, }, ) async def get_catalog_roles( job_id: str, token_data: Annotated[dict, Depends(verify_token)] = None, # pylint: disable=unused-argument scope_data: Annotated[dict, Depends(require_catalog_read)] = None, # pylint: disable=unused-argument service: CatalogRolesService = Depends(get_catalog_roles_service), ) -> GetRolesResponse: """Return roles from the parse-catalog intermediate JSON for a given job. Args: job_id: The job identifier (UUID). token_data: Validated token data from JWT (injected by dependency). scope_data: Token data with validated 'catalog:read' scope (injected by dependency). Returns: GetRolesResponse containing the job_id and list of role names. Raises: HTTPException 400: If job_id is not a valid UUID format. HTTPException 401: If the Bearer token is missing or invalid. HTTPException 403: If the token lacks the required scope. HTTPException 404: If the job does not exist. HTTPException 422: If parse-catalog stage has not completed. HTTPException 500: If an unexpected error occurs. """ log_secure_info( "info", f"Get catalog roles request: job_id={job_id}", job_id=job_id, ) try: validated_job_id = JobId(job_id) except ValueError as exc: log_secure_info( "warning", f"Get catalog roles failed: job_id={job_id}, reason=invalid_job_id," f" detail={exc}, status=400", job_id=job_id, exc_info=True, end_section=True, ) raise HTTPException( status_code=status.HTTP_400_BAD_REQUEST, detail={ "error_code": "INVALID_JOB_ID", "message": f"Invalid job_id format: {job_id}", }, ) from exc try: log_secure_info( "debug", f"Get catalog roles executing: job_id={job_id}", job_id=job_id, ) result = service.get_roles(validated_job_id) log_secure_info( "info", f"Get catalog roles success: job_id={job_id}, status=200", job_id=job_id, end_section=True, ) return GetRolesResponse( job_id=job_id, roles=result["roles"], image_key=result["image_key"], architectures=result["architectures"], ) except UpstreamStageNotCompletedError as exc: log_secure_info( "error", f"Get catalog roles failed: job_id={job_id}, reason=upstream_not_completed, status=412", job_id=job_id, end_section=True, ) raise HTTPException( status_code=status.HTTP_412_PRECONDITION_FAILED, detail={ "error": "UPSTREAM_STAGE_NOT_COMPLETED", "message": exc.message, "correlation_id": exc.correlation_id, }, ) from exc except RolesNotFoundError as exc: log_secure_info( "error", f"Get catalog roles failed: job_id={job_id}," f" reason=roles_not_found, detail={exc}, status=404", job_id=job_id, exc_info=True, end_section=True, ) raise HTTPException( status_code=status.HTTP_404_NOT_FOUND, detail={ "error_code": "ROLES_NOT_FOUND", "message": str(exc), }, ) from exc except JobNotFoundError as exc: log_secure_info( "error", f"Get catalog roles failed: job_id={job_id}," f" reason=job_not_found, status=404", job_id=job_id, end_section=True, ) raise HTTPException( status_code=status.HTTP_404_NOT_FOUND, detail={ "error_code": "JOB_NOT_FOUND", "message": f"Job not found: {job_id}", }, ) from exc except Exception as exc: log_secure_info( 
"error", f"Get catalog roles failed: job_id={job_id}," f" reason=unexpected_error, status=500", job_id=job_id, exc_info=True, end_section=True, ) raise HTTPException( status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail={ "error_code": "INTERNAL_ERROR", "message": "An unexpected error occurred", }, ) from exc ================================================ FILE: build_stream/api/catalog_roles/schemas.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Pydantic schemas for catalog roles API request and response models.""" from typing import List from pydantic import BaseModel, Field class GetRolesResponse(BaseModel): # pylint: disable=too-few-public-methods """Response model for GET /jobs/{job_id}/catalog/roles.""" job_id: str = Field(..., description="The job identifier") roles: List[str] = Field(..., description="List of role names from the parsed catalog") image_key: str = Field(..., description="Catalog identifier to use as image_key in build-image API") architectures: List[str] = Field(..., description="List of supported architectures (e.g., x86_64, aarch64)") model_config = { "json_schema_extra": { "examples": [ { "job_id": "019bf590-1234-7890-abcd-ef1234567890", "roles": [ "login_compiler_node_x86_64", "service_kube_control_plane_x86_64", "service_kube_node_x86_64", "slurm_control_node_x86_64", "slurm_node_x86_64", ], "image_key": "image-build", "architectures": ["aarch64", "x86_64"], } ] } } class ErrorResponse(BaseModel): # pylint: disable=too-few-public-methods """Standard error response model.""" error_code: str = Field(..., description="Machine-readable error code") message: str = Field(..., description="Human-readable error message") correlation_id: str = Field(..., description="Request correlation identifier") ================================================ FILE: build_stream/api/catalog_roles/service.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
"""Business logic service for catalog roles API.""" import io import json import logging import zipfile from typing import Dict, List from core.artifacts.exceptions import ArtifactNotFoundError from core.artifacts.interfaces import ArtifactMetadataRepository, ArtifactStore from core.artifacts.value_objects import ArtifactKind from core.jobs.exceptions import InvalidStateTransitionError, JobNotFoundError, UpstreamStageNotCompletedError from core.jobs.repositories import JobRepository, StageRepository from core.jobs.value_objects import JobId, StageName, StageState, StageType logger = logging.getLogger(__name__) _FUNCTIONAL_LAYER_FILENAME = "functional_layer.json" class RolesNotFoundError(Exception): """Raised when no functional_layer.json can be found in the root-jsons archive.""" class CatalogRolesService: """Service for retrieving roles from the parse-catalog intermediate artifacts.""" def __init__( self, artifact_store: ArtifactStore, artifact_metadata_repo: ArtifactMetadataRepository, stage_repo: StageRepository, job_repo: JobRepository, ) -> None: self._artifact_store = artifact_store self._artifact_metadata_repo = artifact_metadata_repo self._stage_repo = stage_repo self._job_repo = job_repo def get_roles(self, job_id: JobId) -> Dict[str, any]: """Return catalog metadata including roles, image_key, and architectures. Retrieves the root-jsons archive and catalog file artifacts stored by the parse-catalog stage. Validates that parse-catalog has completed. Args: job_id: The job identifier. Returns: Dictionary with keys: - roles: Sorted list of role name strings - image_key: Catalog identifier - architectures: List of supported architectures Raises: UpstreamStageNotCompletedError: If parse-catalog has not completed or artifacts are missing. RolesNotFoundError: If functional_layer.json cannot be parsed. 
""" logger.info("Retrieving catalog metadata for job: %s", job_id) # Validate job exists first if not self._job_repo.exists(job_id): logger.warning( "Job not found for catalog metadata retrieval: %s", job_id ) raise JobNotFoundError(str(job_id)) # Validate parse-catalog stage is completed self._validate_parse_catalog_completed(job_id) record = self._artifact_metadata_repo.find_by_job_stage_and_label( job_id=job_id, stage_name=StageName(StageType.PARSE_CATALOG.value), label="root-jsons", ) if record is None: logger.warning( "root-jsons artifact not found for job %s; parse-catalog may not have completed", job_id, ) raise UpstreamStageNotCompletedError( job_id=str(job_id), required_stage="parse-catalog", actual_state="NOT_COMPLETED", ) logger.debug( "Found root-jsons artifact record for job %s (key=%s)", job_id, record.artifact_ref.key.value, ) try: raw_bytes = self._artifact_store.retrieve( key=record.artifact_ref.key, kind=ArtifactKind.FILE, ) except ArtifactNotFoundError as exc: logger.error( "root-jsons artifact file missing from store for job %s", job_id ) raise UpstreamStageNotCompletedError( job_id=str(job_id), required_stage="parse-catalog", actual_state="NOT_FOUND", ) from exc # Extract roles from functional_layer.json roles = self._extract_roles_from_archive(raw_bytes, job_id) # Extract catalog metadata (Identifier and architectures) catalog_metadata = self._extract_catalog_metadata(job_id) result = { "roles": roles, "image_key": catalog_metadata["image_key"], "architectures": catalog_metadata["architectures"], } logger.info( "Returning catalog metadata for job %s: %d roles, image_key=%s, %d architectures", job_id, len(roles), result["image_key"], len(result["architectures"]), ) return result def _extract_roles_from_archive( self, raw_bytes: bytes, job_id: JobId ) -> List[str]: """Extract role names from the root-jsons zip archive. Searches all entries in the archive for any file named ``functional_layer.json`` and returns the sorted top-level keys of the first one found. Args: raw_bytes: Raw bytes of the zip archive. job_id: Job identifier (used only for logging). Returns: Sorted list of role name strings. Raises: RolesNotFoundError: If no functional_layer.json is found or the file cannot be parsed. 
""" try: with zipfile.ZipFile(io.BytesIO(raw_bytes), "r") as zf: candidates = [ name for name in zf.namelist() if name.endswith(_FUNCTIONAL_LAYER_FILENAME) ] if not candidates: logger.error( "No %s found in root-jsons archive for job %s", _FUNCTIONAL_LAYER_FILENAME, job_id, ) raise RolesNotFoundError( f"No {_FUNCTIONAL_LAYER_FILENAME} found in the " f"root-jsons archive for job: {job_id}" ) # Use the first functional_layer.json found (any arch/os/version) target = candidates[0] logger.debug( "Reading roles from archive entry: %s (job=%s)", target, job_id ) with zf.open(target) as f: data = json.load(f) except zipfile.BadZipFile as exc: logger.error( "root-jsons artifact is not a valid zip archive for job %s", job_id ) raise RolesNotFoundError( f"root-jsons artifact is not a valid archive for job: {job_id}" ) from exc except json.JSONDecodeError as exc: logger.error( "Failed to parse %s in archive for job %s", _FUNCTIONAL_LAYER_FILENAME, job_id, ) raise RolesNotFoundError( f"Failed to parse {_FUNCTIONAL_LAYER_FILENAME} for job: {job_id}" ) from exc if not isinstance(data, dict): raise RolesNotFoundError( f"{_FUNCTIONAL_LAYER_FILENAME} does not contain a JSON object for job: {job_id}" ) roles = sorted(data.keys()) # Add service_kube_control_plane_first_x86 if service_kube_control_plane_x86_64 exists if "service_kube_control_plane_x86_64" in roles and "service_kube_control_plane_first_x86_64" not in roles: roles.append("service_kube_control_plane_first_x86_64") roles = sorted(roles) return roles def _validate_parse_catalog_completed(self, job_id: JobId) -> None: """Validate that parse-catalog stage has completed. Args: job_id: The job identifier. Raises: UpstreamStageNotCompletedError: If stage is not in COMPLETED state. """ stage = self._stage_repo.find_by_job_and_name( job_id, StageName(StageType.PARSE_CATALOG.value) ) if stage is None: logger.warning( "parse-catalog stage not found for job %s", job_id ) raise UpstreamStageNotCompletedError( job_id=str(job_id), required_stage="parse-catalog", actual_state="NOT_FOUND", ) if stage.stage_state != StageState.COMPLETED: logger.warning( "parse-catalog stage not completed for job %s (state=%s)", job_id, stage.stage_state.value, ) raise UpstreamStageNotCompletedError( job_id=str(job_id), required_stage="parse-catalog", actual_state=stage.stage_state.value, ) def _extract_catalog_metadata(self, job_id: JobId) -> Dict[str, any]: """Extract catalog Identifier and architectures from catalog-file artifact. Args: job_id: The job identifier. Returns: Dictionary with 'image_key' and 'architectures' keys. Raises: UpstreamStageNotCompletedError: If catalog-file artifact not found. RolesNotFoundError: If catalog cannot be parsed. 
""" # Find catalog-file artifact catalog_record = self._artifact_metadata_repo.find_by_job_stage_and_label( job_id=job_id, stage_name=StageName(StageType.PARSE_CATALOG.value), label="catalog-file", ) if catalog_record is None: logger.error( "catalog-file artifact not found for job %s", job_id ) raise UpstreamStageNotCompletedError( job_id=str(job_id), required_stage="parse-catalog", actual_state="NOT_FOUND", ) try: catalog_bytes = self._artifact_store.retrieve( key=catalog_record.artifact_ref.key, kind=ArtifactKind.FILE, ) except ArtifactNotFoundError as exc: logger.error( "catalog-file missing from store for job %s", job_id ) raise UpstreamStageNotCompletedError( job_id=str(job_id), required_stage="parse-catalog", actual_state="NOT_FOUND", ) from exc try: catalog_data = json.loads(catalog_bytes.decode("utf-8")) except (json.JSONDecodeError, UnicodeDecodeError) as exc: logger.error( "Failed to parse catalog file for job %s", job_id ) raise RolesNotFoundError( f"Failed to parse catalog file for job: {job_id}" ) from exc # Extract Identifier (image_key) catalog_obj = catalog_data.get("Catalog", {}) image_key = catalog_obj.get("Identifier", "") if not image_key: logger.warning( "No Identifier found in catalog for job %s", job_id ) image_key = "unknown" # Extract architectures from functional packages architectures = set() functional_packages = catalog_obj.get("FunctionalPackages", {}) # Handle both dictionary and array formats if isinstance(functional_packages, dict): # Dictionary format: {"package_id": {"Architecture": [...]}} for pkg_id, pkg_data in functional_packages.items(): if isinstance(pkg_data, dict): arch_list = pkg_data.get("Architecture", []) if isinstance(arch_list, list): architectures.update(arch_list) elif isinstance(arch_list, str): architectures.add(arch_list) elif isinstance(functional_packages, list): # Array format: [{"Architecture": [...]}, ...] for pkg in functional_packages: if not isinstance(pkg, dict): continue arch_list = pkg.get("Architecture", []) if isinstance(arch_list, list): architectures.update(arch_list) elif isinstance(arch_list, str): architectures.add(arch_list) # Also check OS packages for architectures os_packages = catalog_obj.get("OSPackages", {}) # Handle both dictionary and array formats if isinstance(os_packages, dict): # Dictionary format: {"os_package_id": {"Architecture": [...]}} for pkg_id, pkg_data in os_packages.items(): if isinstance(pkg_data, dict): arch_list = pkg_data.get("Architecture", []) if isinstance(arch_list, list): architectures.update(arch_list) elif isinstance(arch_list, str): architectures.add(arch_list) elif isinstance(os_packages, list): # Array format: [{"Architecture": [...]}, ...] for pkg in os_packages: if not isinstance(pkg, dict): continue arch_list = pkg.get("Architecture", []) if isinstance(arch_list, list): architectures.update(arch_list) elif isinstance(arch_list, str): architectures.add(arch_list) return { "image_key": image_key, "architectures": sorted(list(architectures)), } ================================================ FILE: build_stream/api/dependencies.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. 
# You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Common dependencies for API endpoints. This module provides all FastAPI dependencies including authentication, authorization, database sessions, repositories, and domain-specific use cases. """ import logging import os from typing import Annotated, Generator from fastapi import Depends, Header, HTTPException, status from fastapi.security import HTTPBearer, HTTPAuthorizationCredentials from sqlalchemy.orm import Session from api.auth.jwt_handler import ( JWTExpiredError, JWTHandler, JWTInvalidSignatureError, JWTValidationError, ) from api.logging_utils import log_secure_info logger = logging.getLogger(__name__) # Environment configuration _ENV = os.getenv("ENV", "prod") # Authentication setup security = HTTPBearer(auto_error=False) _jwt_handler = JWTHandler() def _get_container(): """Lazy import of container to avoid circular imports.""" from container import container # pylint: disable=import-outside-toplevel return container # ------------------------------------------------------------------ # Authentication & Authorization # ------------------------------------------------------------------ def get_jwt_handler() -> JWTHandler: """Get the JWT handler instance. Returns: JWTHandler instance for token operations. """ return _jwt_handler def verify_token( credentials: Annotated[HTTPAuthorizationCredentials, Depends(security)], jwt_handler: Annotated[JWTHandler, Depends(get_jwt_handler)], ) -> dict: """Verify JWT token from Authorization header. Args: credentials: HTTP Authorization credentials from request. jwt_handler: JWT handler instance. Returns: Token data dictionary with client information. Raises: HTTPException: If token is missing, invalid, or expired. 
""" if credentials is None: logger.warning("Request missing Authorization header") raise HTTPException( status_code=status.HTTP_401_UNAUTHORIZED, detail={ "error": "missing_token", "error_description": "Authorization header is required", }, headers={"WWW-Authenticate": "Bearer"}, ) try: token_data = jwt_handler.validate_token(credentials.credentials) log_secure_info("info", "Token validated successfully", token_data.client_id) return { "client_id": token_data.client_id, "client_name": token_data.client_name, "scopes": token_data.scopes, "token_id": token_data.token_id, } except JWTExpiredError: logger.warning("Token validation failed - token expired") raise HTTPException( status_code=status.HTTP_401_UNAUTHORIZED, detail={ "error": "token_expired", "error_description": "Access token has expired", }, headers={"WWW-Authenticate": "Bearer"}, ) from None except JWTInvalidSignatureError: logger.warning("Token validation failed - invalid signature") raise HTTPException( status_code=status.HTTP_401_UNAUTHORIZED, detail={ "error": "invalid_token", "error_description": "Invalid token signature", }, headers={"WWW-Authenticate": "Bearer"}, ) from None except JWTValidationError: logger.warning("Token validation failed: Invalid token format or content") raise HTTPException( status_code=status.HTTP_401_UNAUTHORIZED, detail={ "error": "invalid_token", "error_description": "Invalid access token", }, headers={"WWW-Authenticate": "Bearer"}, ) from None def require_scope(required_scope: str): """Create a dependency that requires a specific scope. Args: required_scope: The required scope (e.g., "catalog:read"). Returns: Dependency function that validates the required scope. """ def scope_dependency( token_data: Annotated[dict, Depends(verify_token)] ) -> dict: """Validate that the token has the required scope. Args: token_data: Token data from verify_token dependency. Returns: Token data if scope is valid. Raises: HTTPException: If required scope is not present. """ if required_scope not in token_data["scopes"]: logger.warning( "Access denied - missing required scope: %s (client: %s)", required_scope, token_data["client_id"][:8] + "..." ) raise HTTPException( status_code=status.HTTP_403_FORBIDDEN, detail={ "error": "insufficient_scope", "error_description": f"Required scope '{required_scope}' is missing", }, ) logger.info( "Scope validation passed for client: %s, scope: %s", token_data["client_id"][:8] + "...", required_scope ) return token_data return scope_dependency # Common scope dependencies require_catalog_read = require_scope("catalog:read") require_catalog_write = require_scope("catalog:write") require_job_write = require_scope("job:write") # ------------------------------------------------------------------ # Database Session Management # ------------------------------------------------------------------ def get_db_session() -> Generator[Session, None, None]: """Yield a single DB session per request for shared transaction context. In production, this creates a database session that is shared across all repositories within a single request, ensuring transactional consistency. In dev mode, returns None since in-memory repositories don't need sessions. 
""" if _ENV != "prod": yield None # type: ignore[misc] return from infra.db.session import SessionLocal # pylint: disable=import-outside-toplevel session = SessionLocal() try: yield session session.commit() except Exception: session.rollback() raise finally: session.close() # ------------------------------------------------------------------ # Repository Factory Helpers # ------------------------------------------------------------------ def _create_sql_job_repo(session: Session): """Create SQL job repository with session.""" from infra.db.repositories import SqlJobRepository # pylint: disable=import-outside-toplevel return SqlJobRepository(session=session) def _create_sql_stage_repo(session: Session): """Create SQL stage repository with session.""" from infra.db.repositories import SqlStageRepository # pylint: disable=import-outside-toplevel return SqlStageRepository(session=session) def _create_sql_idempotency_repo(session: Session): """Create SQL idempotency repository with session.""" from infra.db.repositories import SqlIdempotencyRepository # pylint: disable=import-outside-toplevel return SqlIdempotencyRepository(session=session) def _create_sql_audit_repo(session: Session): """Create SQL audit event repository with session.""" from infra.db.repositories import SqlAuditEventRepository # pylint: disable=import-outside-toplevel return SqlAuditEventRepository(session=session) # ------------------------------------------------------------------ # Stage Failure Helper # ------------------------------------------------------------------ def mark_stage_as_failed( job_id: str, stage_name: str, error_code: str, error_summary: str, db_session: Session = None ): """Mark a stage as failed when validation fails at API layer. Also marks the job as FAILED to maintain consistency with orchestrator behavior. 
Args: job_id: The job identifier stage_name: The stage name (e.g., 'parse-catalog') error_code: Error classification code error_summary: Human-readable error description db_session: Database session (if None, creates new session) """ from core.jobs.value_objects import JobId, StageName # pylint: disable=import-outside-toplevel from core.jobs.services import JobStateHelper # pylint: disable=import-outside-toplevel try: # Get or create session if db_session is None and _ENV == "prod": from infra.db.session import SessionLocal # pylint: disable=import-outside-toplevel db_session = SessionLocal() should_close = True else: should_close = False stage_repo = ( _create_sql_stage_repo(db_session) if _ENV == "prod" else _get_container().stage_repository() ) # Find the stage stage = stage_repo.find_by_job_and_name(JobId(job_id), StageName(stage_name)) if stage and stage.stage_state.value == "PENDING": # Start the stage first if it's still PENDING stage.start() stage_repo.save(stage) # Then mark it as failed stage.fail(error_code=error_code, error_summary=error_summary) stage_repo.save(stage) # Commit after failing the stage if _ENV == "prod" and db_session.is_active: db_session.commit() # Also mark the job as FAILED (same as orchestrator) if _ENV == "prod": from infra.id_generator import UUIDv4Generator # pylint: disable=import-outside-toplevel job_repo = _create_sql_job_repo(db_session) audit_repo = _create_sql_audit_repo(db_session) uuid_generator = UUIDv4Generator() # Transition job to IN_PROGRESS first if it's CREATED job = job_repo.find_by_id(JobId(job_id)) if job and job.job_state.value == "CREATED": job.start() job_repo.save(job) if db_session.is_active: db_session.commit() JobStateHelper.handle_stage_failure( job_repo=job_repo, audit_repo=audit_repo, uuid_generator=uuid_generator, job_id=JobId(job_id), stage_name=stage_name, error_code=error_code, error_summary=error_summary, correlation_id=str(uuid_generator.generate()), client_id="unknown", ) # Ensure the session is committed after JobStateHelper completes if db_session.is_active: db_session.commit() if should_close and db_session: db_session.close() except Exception as e: log_secure_info("warning", "Failed to mark stage as failed: %s", str(e), job_id=job_id) if db_session: db_session.rollback() # ------------------------------------------------------------------ # Repository Providers # ------------------------------------------------------------------ def get_job_repo(db_session: Session = Depends(get_db_session)): """Provide job repository with shared session in prod.""" if _ENV == "prod": return _create_sql_job_repo(db_session) return _get_container().job_repository() def get_stage_repo(db_session: Session = Depends(get_db_session)): """Provide stage repository with shared session in prod.""" if _ENV == "prod": return _create_sql_stage_repo(db_session) return _get_container().stage_repository() def get_audit_repo(db_session: Session = Depends(get_db_session)): """Provide audit event repository.""" if _ENV == "prod": return _create_sql_audit_repo(db_session) return _get_container().audit_repository() # ------------------------------------------------------------------ # Job-Specific Dependencies # ------------------------------------------------------------------ from core.jobs.value_objects import ClientId, CorrelationId from infra.id_generator import JobUUIDGenerator from orchestrator.jobs.use_cases import CreateJobUseCase def get_id_generator() -> JobUUIDGenerator: """Provide job ID generator.""" return 
_get_container().job_id_generator() def get_client_id(token_data: dict) -> ClientId: """Extract ClientId from verified token data. Note: token_data comes from verify_token dependency injected in the route. This function is called after verify_token has already validated the JWT. Args: token_data: Token data dict from verify_token dependency. Returns: ClientId extracted from token. """ return ClientId(token_data["client_id"]) def get_correlation_id( x_correlation_id: Annotated[str, Header( alias="X-Correlation-Id", description="Request tracing ID", )] = None, ) -> CorrelationId: """Return provided correlation ID or generate one.""" generator = _get_container().uuid_generator() if x_correlation_id: try: correlation_id = CorrelationId(x_correlation_id) return correlation_id except ValueError: pass generated_id = generator.generate() return CorrelationId(str(generated_id)) def get_idempotency_key( idempotency_key: Annotated[str, Header( alias="Idempotency-Key", description="Client-provided deduplication token", )] = None, ) -> str: """Validate and return the Idempotency-Key header.""" if idempotency_key is None or not idempotency_key.strip(): raise HTTPException( status_code=status.HTTP_422_UNPROCESSABLE_CONTENT, detail="Idempotency-Key must be provided", ) key = idempotency_key.strip() if len(key) > 255: raise HTTPException( status_code=status.HTTP_422_UNPROCESSABLE_CONTENT, detail="Idempotency-Key length must be <= 255 characters", ) return key def get_create_job_use_case( db_session: Session = Depends(get_db_session), ) -> CreateJobUseCase: """Provide create-job use case with shared session in prod.""" if _ENV == "prod": container = _get_container() return CreateJobUseCase( job_repo=_create_sql_job_repo(db_session), stage_repo=_create_sql_stage_repo(db_session), idempotency_repo=_create_sql_idempotency_repo(db_session), audit_repo=_create_sql_audit_repo(db_session), job_id_generator=container.job_id_generator(), uuid_generator=container.uuid_generator(), ) return _get_container().create_job_use_case() ================================================ FILE: build_stream/api/generate_input_files/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """GenerateInputFiles API module.""" from api.generate_input_files.routes import router __all__ = ["router"] ================================================ FILE: build_stream/api/generate_input_files/dependencies.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. 
# You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """FastAPI dependency providers for GenerateInputFiles API. This module provides generate-input-files-specific dependencies like the generate input files use case provider. """ from fastapi import Depends from sqlalchemy.orm import Session from api.dependencies import ( get_db_session, _create_sql_job_repo, _create_sql_stage_repo, _create_sql_audit_repo, _get_container, _ENV, ) from orchestrator.catalog.use_cases import GenerateInputFilesUseCase # ------------------------------------------------------------------ # Generate-input-files-specific dependency providers # ------------------------------------------------------------------ def get_generate_input_files_use_case( db_session: Session = Depends(get_db_session), ) -> GenerateInputFilesUseCase: """Provide generate-input-files use case with shared session in prod.""" if _ENV == "prod": from infra.db.repositories import SqlArtifactMetadataRepository container = _get_container() return GenerateInputFilesUseCase( job_repo=_create_sql_job_repo(db_session), stage_repo=_create_sql_stage_repo(db_session), audit_repo=_create_sql_audit_repo(db_session), artifact_store=container.artifact_store(), artifact_metadata_repo=SqlArtifactMetadataRepository(db_session), uuid_generator=container.uuid_generator(), default_policy_path=container.default_policy_path(), policy_schema_path=container.policy_schema_path(), ) return _get_container().generate_input_files_use_case() ================================================ FILE: build_stream/api/generate_input_files/routes.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
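# ---------------------------------------------------------------------------
# Illustrative sketch (not part of the repository): the dependency providers
# above follow the same wiring rule as get_create_build_image_use_case and
# get_catalog_roles_service: in prod the repositories are built on the
# request-scoped SQL session so the whole request shares one transaction, and
# in any other environment the provider returns the container's pre-wired
# singleton. Stripped of FastAPI and the real classes, the pattern reduces to
# a conditional factory like this (all names here are stand-ins):

import os
from dataclasses import dataclass


@dataclass
class ExampleUseCase:
    """Records which repositories it was wired with."""
    job_repo: str
    stage_repo: str


class ExampleContainer:
    """Stand-in DI container exposing in-memory singletons."""

    def example_use_case(self) -> ExampleUseCase:
        return ExampleUseCase("in-memory job repo", "in-memory stage repo")


def get_example_use_case(db_session: str, container: ExampleContainer,
                         env: str = os.getenv("ENV", "prod")) -> ExampleUseCase:
    if env == "prod":
        # prod: bind every repository to the per-request session
        return ExampleUseCase(
            job_repo=f"SQL job repo on {db_session}",
            stage_repo=f"SQL stage repo on {db_session}",
        )
    # dev / test: reuse the container singleton
    return container.example_use_case()


print(get_example_use_case("session-1", ExampleContainer(), env="dev"))
# ---------------------------------------------------------------------------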
"""FastAPI routes for GenerateInputFiles API.""" import uuid from typing import Annotated, Optional from fastapi import APIRouter, Body, Depends, HTTPException, status from api.dependencies import require_catalog_read, verify_token, mark_stage_as_failed, get_db_session from api.generate_input_files.dependencies import get_generate_input_files_use_case from api.logging_utils import log_secure_info from core.artifacts.exceptions import ArtifactNotFoundError from core.artifacts.value_objects import SafePath from core.catalog.exceptions import ( AdapterPolicyValidationError, ConfigGenerationError, ) from core.jobs.exceptions import ( JobNotFoundError, StageAlreadyCompletedError, TerminalStateViolationError, UpstreamStageNotCompletedError, ) from core.jobs.value_objects import CorrelationId, JobId from orchestrator.catalog.commands.generate_input_files import ( GenerateInputFilesCommand, ) from orchestrator.catalog.use_cases import GenerateInputFilesUseCase from api.generate_input_files.schemas import ( ArtifactRefResponse, ErrorResponse, GenerateInputFilesRequest, GenerateInputFilesResponse, ) router = APIRouter(prefix="/jobs", tags=["Input File Generation"]) @router.post( "/{job_id}/stages/generate-input-files", response_model=GenerateInputFilesResponse, status_code=status.HTTP_200_OK, summary="Generate input files from parsed catalog", responses={ 400: {"description": "Invalid request", "model": ErrorResponse}, 404: {"description": "Job not found", "model": ErrorResponse}, 409: {"description": "Stage already completed", "model": ErrorResponse}, 422: {"description": "Upstream stage not completed", "model": ErrorResponse}, 500: {"description": "Internal server error", "model": ErrorResponse}, }, ) async def generate_input_files( job_id: str, request_body: Optional[GenerateInputFilesRequest] = Body(default=None), token_data: Annotated[dict, Depends(verify_token)] = None, # pylint: disable=unused-argument scope_data: Annotated[dict, Depends(require_catalog_read)] = None, # pylint: disable=unused-argument use_case: Annotated[GenerateInputFilesUseCase, Depends(get_generate_input_files_use_case)] = None, db_session = Depends(get_db_session), ) -> GenerateInputFilesResponse: """Generate Omnia input files from a parsed catalog. Args: job_id: The job identifier. request_body: Optional request with custom adapter policy path. token_data: Validated token data from JWT (injected by dependency). scope_data: Token data with validated scope (injected by dependency). Returns: GenerateInputFilesResponse with generated config details. 
""" correlation_id = str(uuid.uuid4()) adapter_path_str = ( request_body.adapter_policy_path if request_body and request_body.adapter_policy_path else "default" ) log_secure_info( "info", f"Generate-input-files request: job_id={job_id}, " f"adapter_policy={adapter_path_str}, correlation_id={correlation_id}", job_id=job_id, ) try: validated_job_id = JobId(job_id) except ValueError as e: log_secure_info("error", f"Generate-input-files failed: job_id={job_id}, reason=invalid_job_id, status=400", job_id=job_id, end_section=True) raise HTTPException( status_code=status.HTTP_400_BAD_REQUEST, detail={"error": "INVALID_JOB_ID", "message": str(e)}, ) from e adapter_policy_path = None if request_body and request_body.adapter_policy_path: try: adapter_policy_path = SafePath.from_string( request_body.adapter_policy_path ) except ValueError as e: log_secure_info("error", f"Generate-input-files failed: job_id={job_id}, reason=invalid_policy_path, status=400", job_id=job_id, end_section=True) # Mark stage as failed since validation failed at API layer mark_stage_as_failed(job_id, "generate-input-files", "INVALID_POLICY_PATH", str(e), db_session) raise HTTPException( status_code=status.HTTP_400_BAD_REQUEST, detail={"error": "INVALID_POLICY_PATH", "message": str(e)}, ) from e command = GenerateInputFilesCommand( job_id=validated_job_id, correlation_id=CorrelationId(correlation_id), adapter_policy_path=adapter_policy_path, ) try: result = use_case.execute(command) log_secure_info( "debug", f"Generate-input-files executing: job_id={job_id}, " f"adapter_policy={adapter_path_str}, correlation_id={correlation_id}", job_id=job_id, ) log_secure_info( "info", f"Generate-input-files success: job_id={job_id}, " f"config_file_count={result.config_file_count}, stage_state={result.stage_state}, status=200", job_id=job_id, end_section=True, ) return GenerateInputFilesResponse( job_id=result.job_id, stage_state=result.stage_state, message=result.message, configs_ref=ArtifactRefResponse( key=str(result.configs_ref.key), digest=str(result.configs_ref.digest), size_bytes=result.configs_ref.size_bytes, uri=result.configs_ref.uri, ), config_file_count=result.config_file_count, config_files=result.config_files, completed_at=result.completed_at, ) except JobNotFoundError as e: log_secure_info("error", f"Generate-input-files failed: job_id={job_id}, reason=job_not_found, status=404", job_id=job_id, end_section=True) raise HTTPException( status_code=status.HTTP_404_NOT_FOUND, detail={"error": "JOB_NOT_FOUND", "message": e.message}, ) from e except TerminalStateViolationError as e: log_secure_info("error", f"Generate-input-files failed: job_id={job_id}, reason=terminal_state, status=409", job_id=job_id, end_section=True) raise HTTPException( status_code=status.HTTP_409_CONFLICT, detail={"error": "TERMINAL_STATE", "message": e.message}, ) from e except StageAlreadyCompletedError as e: log_secure_info("error", f"Generate-input-files failed: job_id={job_id}, reason=stage_already_completed, status=409", job_id=job_id, end_section=True) raise HTTPException( status_code=status.HTTP_409_CONFLICT, detail={"error": "STAGE_ALREADY_COMPLETED", "message": e.message}, ) from e except UpstreamStageNotCompletedError as e: log_secure_info("error", f"Generate-input-files failed: job_id={job_id}, reason=upstream_not_completed, status=412", job_id=job_id, end_section=True) raise HTTPException( status_code=status.HTTP_412_PRECONDITION_FAILED, detail={ "error": "UPSTREAM_STAGE_NOT_COMPLETED", "message": e.message, }, ) from e except 
ArtifactNotFoundError as e: log_secure_info("error", f"Generate-input-files failed: job_id={job_id}, reason=upstream_artifact_not_found, status=422", job_id=job_id, end_section=True) raise HTTPException( status_code=status.HTTP_422_UNPROCESSABLE_ENTITY, detail={ "error": "UPSTREAM_ARTIFACT_NOT_FOUND", "message": e.message, }, ) from e except (AdapterPolicyValidationError, ConfigGenerationError) as e: log_secure_info("error", f"Generate-input-files failed: job_id={job_id}, reason=config_generation_failed, status=500", job_id=job_id, end_section=True) raise HTTPException( status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail={"error": "CONFIG_GENERATION_FAILED", "message": e.message}, ) from e except Exception as e: log_secure_info("error", f"Generate-input-files failed: job_id={job_id}, reason=unexpected_error, status=500", job_id=job_id, exc_info=True, end_section=True) raise HTTPException( status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail={"error": "INTERNAL_ERROR", "message": "An unexpected error occurred"}, ) from e ================================================ FILE: build_stream/api/generate_input_files/schemas.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Pydantic schemas for GenerateInputFiles API.""" from typing import List, Optional, Tuple from pydantic import BaseModel, Field class GenerateInputFilesRequest(BaseModel): """Request model for GenerateInputFiles API.""" adapter_policy_path: Optional[str] = Field( default=None, max_length=4096, description="Optional custom adapter policy path. Uses default if omitted.", ) class ArtifactRefResponse(BaseModel): """Artifact reference in API responses.""" key: str = Field(..., description="Artifact key") digest: str = Field(..., description="SHA-256 content digest") size_bytes: int = Field(..., description="Content size in bytes") uri: str = Field(..., description="Storage URI") class GenerateInputFilesResponse(BaseModel): """Response model for GenerateInputFiles API.""" job_id: str = Field(..., description="Job identifier") stage_state: str = Field(..., description="Stage state after execution") message: str = Field(..., description="Human-readable result message") class ErrorResponse(BaseModel): """Standard error response model.""" error: str = Field(..., description="Error code") message: str = Field(..., description="Error message") correlation_id: Optional[str] = Field( default=None, description="Correlation ID for tracing" ) ================================================ FILE: build_stream/api/jobs/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. 
# You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. __all__ = [] ================================================ FILE: build_stream/api/jobs/dependencies.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """FastAPI dependency providers for Jobs API. This module re-exports job-specific dependencies from the main dependencies module to maintain backward compatibility. """ # Re-export only the dependencies that are actually used from api.dependencies import ( # Job-specific get_correlation_id, get_idempotency_key, get_create_job_use_case, get_job_repo, get_stage_repo, get_audit_repo, ) ================================================ FILE: build_stream/api/jobs/routes.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
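# ---------------------------------------------------------------------------
# Illustrative client call (editor's sketch, not part of the original module):
# a minimal example of how the create-job endpoint defined below might be
# invoked. The base URL, the token value, and the "Idempotency-Key" header
# name are assumptions for illustration only; the "/jobs" path and the
# client_id/client_name request fields come from this module and its schemas.
#
#     import httpx
#
#     resp = httpx.post(
#         "http://localhost:8000/jobs",                      # assumed base URL
#         json={"client_id": "client-001", "client_name": "example"},
#         headers={
#             "Authorization": "Bearer <access-token>",      # from the auth API
#             "Idempotency-Key": "7d9f2c4e-0000-0000-0000-000000000000",
#         },
#     )
#     resp.raise_for_status()   # 201 on first create, 200 on idempotent replay
#     job_id = resp.json()["job_id"]
# ---------------------------------------------------------------------------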
"""FastAPI routes for job lifecycle operations.""" from datetime import datetime, timezone from typing import Annotated from fastapi import APIRouter, Depends, HTTPException, Response, status from core.jobs.exceptions import ( IdempotencyConflictError, InvalidStateTransitionError, JobNotFoundError, ) from core.jobs.repositories import AuditEventRepository from core.jobs.value_objects import ( ClientId, CorrelationId, IdempotencyKey, JobId, JobState, ) from orchestrator.jobs.commands import CreateJobCommand from orchestrator.jobs.use_cases import CreateJobUseCase from api.logging_utils import create_job_log_file, log_secure_info, remove_job_logger from api.dependencies import verify_token from api.logging_utils import create_job_log_file, log_secure_info, remove_job_logger from api.jobs.dependencies import ( get_audit_repo, get_correlation_id, get_create_job_use_case, get_idempotency_key, get_job_repo, get_stage_repo, ) from api.jobs.schemas import ( CreateJobRequest, CreateJobResponse, CreateStageResponse, ErrorResponse, GetJobResponse, GetStageResponse, ) from api.catalog_roles.dependencies import get_catalog_roles_service from api.catalog_roles.service import CatalogRolesService router = APIRouter(prefix="/jobs", tags=["Jobs"]) def _map_job_state_to_api_state(internal_state: JobState) -> str: """Map internal job state to API response state.""" state_mapping = { JobState.CREATED: "PENDING", JobState.IN_PROGRESS: "RUNNING", JobState.COMPLETED: "SUCCEEDED", JobState.FAILED: "FAILED", JobState.CANCELLED: "CLEANED", } return state_mapping.get(internal_state, "UNKNOWN") def _build_error_response( error_code: str, message: str, correlation_id: str, ) -> ErrorResponse: return ErrorResponse( error=error_code, message=message, correlation_id=correlation_id, timestamp=datetime.now(timezone.utc).isoformat() + "Z", ) @router.post( "", response_model=CreateJobResponse, status_code=status.HTTP_201_CREATED, responses={ 200: {"description": "Idempotent replay", "model": CreateJobResponse}, 201: {"description": "Job created", "model": CreateJobResponse}, 400: {"description": "Invalid request", "model": ErrorResponse}, 401: {"description": "Unauthorized", "model": ErrorResponse}, 409: {"description": "Idempotency conflict", "model": ErrorResponse}, 422: {"description": "Validation error", "model": ErrorResponse}, 500: {"description": "Internal error", "model": ErrorResponse}, }, ) async def create_job( request: CreateJobRequest, response: Response, token_data: Annotated[dict, Depends(verify_token)], correlation_id: CorrelationId = Depends(get_correlation_id), idempotency_key: str = Depends(get_idempotency_key), use_case: CreateJobUseCase = Depends(get_create_job_use_case), stage_repo = Depends(get_stage_repo), ) -> CreateJobResponse: """Create a job, handling idempotency and domain errors.""" # pylint: disable=too-many-arguments,too-many-positional-arguments client_id = ClientId(token_data["client_id"]) log_secure_info( "info", f"Create job request: client_name={request.client_name}, " f"correlation_id={correlation_id.value}", identifier=idempotency_key, ) try: command = CreateJobCommand( client_id=client_id, request_client_id=request.client_id, client_name=request.client_name, correlation_id=correlation_id, idempotency_key=IdempotencyKey(idempotency_key), ) log_secure_info( "debug", f"Create job executing: client_id={client_id.value}, " f"client_name={request.client_name}, idempotency_key={idempotency_key}", ) log_secure_info( "debug", f"Create job executing: client_id={client_id.value}, " 
f"client_name={request.client_name}, idempotency_key={idempotency_key}", ) result = use_case.execute(command) if result.is_new: response.status_code = status.HTTP_201_CREATED log_path = create_job_log_file(result.job_id) log_secure_info( "info", f"Job created: job_id={result.job_id}, " f"client_name={request.client_name}, log_file={log_path}", identifier=correlation_id.value, job_id=result.job_id, ) log_path = create_job_log_file(result.job_id) log_secure_info( "info", f"Job created: job_id={result.job_id}, " f"client_name={request.client_name}, log_file={log_path}", identifier=correlation_id.value, job_id=result.job_id, ) else: response.status_code = status.HTTP_200_OK log_secure_info( "info", f"Idempotent replay: job_id={result.job_id}, " f"job_state={result.job_state}", identifier=correlation_id.value, job_id=result.job_id, ) log_secure_info( "info", f"Idempotent replay: job_id={result.job_id}, " f"job_state={result.job_state}", identifier=correlation_id.value, job_id=result.job_id, ) stages_entities = stage_repo.find_all_by_job(JobId(result.job_id)) # pylint: disable=no-member stages = [ CreateStageResponse( stage_name=str(s.stage_name), stage_state=s.stage_state.value, started_at=s.started_at.isoformat() + "Z" if s.started_at else None, ended_at=s.ended_at.isoformat() + "Z" if s.ended_at else None, error_code=s.error_code, error_summary=s.error_summary, ) for s in stages_entities ] log_secure_info( "info", f"Create job response: job_id={result.job_id}, " f"job_state={result.job_state}, status=201", job_id=result.job_id, end_section=True, ) log_secure_info( "info", f"Create job response: job_id={result.job_id}, " f"job_state={result.job_state}, status=201", job_id=result.job_id, end_section=True, ) return CreateJobResponse( job_id=result.job_id, correlation_id=correlation_id.value, job_state=result.job_state, created_at=result.created_at, stages=stages, ) except IdempotencyConflictError as e: log_secure_info( "warning", f"Create job failed: reason=idempotency_conflict, status=409", job_id=None, end_section=True, ) raise HTTPException( status_code=status.HTTP_409_CONFLICT, detail=_build_error_response( "IDEMPOTENCY_CONFLICT", e.message, correlation_id.value, ).model_dump(), ) from e except Exception as e: log_secure_info( "error", "Create job failed: reason=unexpected_error, status=500", exc_info=True, end_section=True, ) raise HTTPException( status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail=_build_error_response( "INTERNAL_ERROR", "An unexpected error occurred", correlation_id.value, ).model_dump(), ) from e @router.get( "/{job_id}", response_model=GetJobResponse, responses={ 200: {"description": "Job retrieved", "model": GetJobResponse}, 400: {"description": "Invalid job_id", "model": ErrorResponse}, 401: {"description": "Unauthorized", "model": ErrorResponse}, 404: {"description": "Job not found", "model": ErrorResponse}, 500: {"description": "Internal error", "model": ErrorResponse}, }, ) async def get_job( job_id: str, token_data: Annotated[dict, Depends(verify_token)], correlation_id: CorrelationId = Depends(get_correlation_id), job_repo = Depends(get_job_repo), stage_repo = Depends(get_stage_repo), audit_repo = Depends(get_audit_repo), catalog_roles_service: CatalogRolesService = Depends(get_catalog_roles_service), ) -> GetJobResponse: """Return a job if it exists for the requesting client.""" client_id = ClientId(token_data["client_id"]) log_secure_info( "info", f"Get job request: job_id={job_id}, correlation_id={correlation_id.value}", identifier=client_id.value, 
job_id=job_id, ) try: validated_job_id = JobId(job_id) except ValueError as e: raise HTTPException( status_code=status.HTTP_400_BAD_REQUEST, detail=_build_error_response( "INVALID_JOB_ID", f"Invalid job_id format: {job_id}", correlation_id.value, ).model_dump(), ) from e try: log_secure_info( "debug", f"Get job lookup: job_id={job_id}, client_id={client_id.value}", job_id=job_id, ) log_secure_info( "debug", f"Get job lookup: job_id={job_id}, client_id={client_id.value}", job_id=job_id, ) job = job_repo.find_by_id(validated_job_id) # pylint: disable=no-member if job is None or job.tombstoned: raise JobNotFoundError(job_id, correlation_id.value) if job.client_id != client_id: raise JobNotFoundError(job_id, correlation_id.value) # Get stage breakdown stages_entities = stage_repo.find_all_by_job(validated_job_id) # pylint: disable=no-member # Try to get supported architectures from catalog to filter build-image stages supported_architectures = [] try: catalog_roles = catalog_roles_service.get_roles(validated_job_id) # catalog_roles returns a dict, not a Pydantic model if isinstance(catalog_roles, dict): supported_architectures = catalog_roles.get("architectures", []) log_secure_info( "debug", f"Filtering build-image stages for job {job_id}: " f"supported_architectures={supported_architectures}", job_id=job_id, ) else: log_secure_info( "warning", f"Unexpected catalog roles type for job {job_id}: " f"{type(catalog_roles).__name__}", job_id=job_id, ) supported_architectures = [] except AttributeError as e: # Specific handling for attribute errors log_secure_info( "warning", f"AttributeError getting catalog roles for job {job_id}", job_id=job_id, ) supported_architectures = [] except Exception as e: # If catalog roles are not available, include all stages (fallback behavior) log_secure_info( "warning", f"Could not get catalog roles for job {job_id}, including all stages", job_id=job_id, ) supported_architectures = [] # Filter stages based on supported architectures filtered_stages = [] for s in stages_entities: stage_name = str(s.stage_name) # Check if this is a build-image stage if stage_name.startswith("build-image-"): # Extract architecture from stage name (e.g., "build-image-x86_64" -> "x86_64") stage_arch = stage_name.replace("build-image-", "") # Only include this build-image stage if the architecture is supported if not supported_architectures or stage_arch in supported_architectures: filtered_stages.append(s) else: log_secure_info( "debug", f"Filtering out build-image stage for unsupported " f"architecture: job_id={job_id}, stage={stage_name}, " f"arch={stage_arch}", job_id=job_id, ) else: # Include all non-build-image stages filtered_stages.append(s) stages = [ GetStageResponse( stage_name=str(s.stage_name), stage_state=s.stage_state.value, started_at=s.started_at.isoformat() + "Z" if s.started_at else None, ended_at=s.ended_at.isoformat() + "Z" if s.ended_at else None, error_code=s.error_code, error_summary=s.error_summary, log_file_path=s.log_file_path, ) for s in filtered_stages ] # Get audit events for state change timestamps audit_events = audit_repo.find_by_job(validated_job_id) # pylint: disable=no-member state_timestamps = {} for event in audit_events: if event.event_type.startswith("JOB_"): state_name = event.event_type.replace("JOB_", "") if state_name in ["CREATED", "IN_PROGRESS", "COMPLETED", "FAILED", "CANCELLED"]: state_timestamps[state_name] = event.timestamp.isoformat() + "Z" # Always include creation timestamp if "CREATED" not in state_timestamps and job.created_at: 
state_timestamps["CREATED"] = job.created_at.isoformat() + "Z" log_secure_info( "info", f"Get job success: job_id={job_id}, " f"job_state={_map_job_state_to_api_state(job.job_state)}, " f"status=200", job_id=job_id, end_section=True, ) return GetJobResponse( job_id=str(job.job_id), correlation_id=correlation_id.value, job_state=_map_job_state_to_api_state(job.job_state), created_at=job.created_at.isoformat() + "Z", updated_at=job.updated_at.isoformat() + "Z" if job.updated_at else None, tombstone=job.tombstoned, stages=stages, state_timestamps=state_timestamps if state_timestamps else None, ) except JobNotFoundError as e: log_secure_info( "warning", f"Get job failed: job_id={job_id}, " f"reason=not_found, status=404", job_id=job_id, end_section=True, ) raise HTTPException( status_code=status.HTTP_404_NOT_FOUND, detail=_build_error_response( "JOB_NOT_FOUND", e.message, correlation_id.value, ).model_dump(), ) from e except Exception as e: log_secure_info( "error", f"Get job failed: job_id={job_id}, " f"reason=unexpected_error, status=500", job_id=job_id, exc_info=True, end_section=True, ) raise HTTPException( status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail=_build_error_response( "INTERNAL_ERROR", "An unexpected error occurred", correlation_id.value, ).model_dump(), ) from e @router.delete( "/{job_id}", status_code=status.HTTP_204_NO_CONTENT, responses={ 204: {"description": "Job deleted successfully"}, 400: {"description": "Invalid job_id", "model": ErrorResponse}, 401: {"description": "Unauthorized", "model": ErrorResponse}, 404: {"description": "Job not found", "model": ErrorResponse}, 500: {"description": "Internal error", "model": ErrorResponse}, }, ) async def delete_job( job_id: str, token_data: Annotated[dict, Depends(verify_token)], correlation_id: CorrelationId = Depends(get_correlation_id), job_repo = Depends(get_job_repo), stage_repo = Depends(get_stage_repo), ) -> None: """Delete (tombstone) a job for the requesting client if it exists.""" client_id = ClientId(token_data["client_id"]) log_secure_info( "info", f"Delete job request: job_id={job_id}, correlation_id={correlation_id.value}", identifier=client_id.value, job_id=job_id, ) try: validated_job_id = JobId(job_id) except ValueError as e: raise HTTPException( status_code=status.HTTP_400_BAD_REQUEST, detail=_build_error_response( "INVALID_JOB_ID", f"Invalid job_id format: {job_id}", correlation_id.value, ).model_dump(), ) from e try: log_secure_info( "debug", f"Delete job lookup: job_id={job_id}, client_id={client_id.value}", job_id=job_id, ) log_secure_info( "debug", f"Delete job lookup: job_id={job_id}, client_id={client_id.value}", job_id=job_id, ) job = job_repo.find_by_id(validated_job_id) # pylint: disable=no-member if job is None: raise JobNotFoundError(job_id, correlation_id.value) if job.client_id != client_id: raise JobNotFoundError(job_id, correlation_id.value) job.tombstone() job_repo.save(job) # pylint: disable=no-member stages_entities = stage_repo.find_all_by_job(validated_job_id) # pylint: disable=no-member cancelled_count = 0 for stage in stages_entities: if not stage.stage_state.is_terminal(): stage.cancel() stage_repo.save(stage) # pylint: disable=no-member cancelled_count += 1 log_secure_info( "info", f"Delete job success: job_id={job_id}, " f"stages_cancelled={cancelled_count}, status=204", job_id=job_id, end_section=True, ) remove_job_logger(job_id) cancelled_count += 1 log_secure_info( "info", f"Delete job success: job_id={job_id}, " f"stages_cancelled={cancelled_count}, status=204", 
job_id=job_id, end_section=True, ) remove_job_logger(job_id) except JobNotFoundError as e: log_secure_info( "warning", f"Delete job failed: job_id={job_id}, " f"reason=not_found, status=404", job_id=job_id, end_section=True, ) raise HTTPException( status_code=status.HTTP_404_NOT_FOUND, detail=_build_error_response( "JOB_NOT_FOUND", e.message, correlation_id.value, ).model_dump(), ) from e except InvalidStateTransitionError as e: log_secure_info( "warning", f"Delete job failed: job_id={job_id}, " f"reason=invalid_state_transition, status=400", job_id=job_id, end_section=True, ) raise HTTPException( status_code=status.HTTP_400_BAD_REQUEST, detail=_build_error_response( "INVALID_STATE_TRANSITION", e.message, correlation_id.value, ).model_dump(), ) from e except Exception as e: log_secure_info( "error", f"Delete job failed: job_id={job_id}, " f"reason=unexpected_error, status=500", job_id=job_id, exc_info=True, end_section=True, ) raise HTTPException( status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail=_build_error_response( "INTERNAL_ERROR", "An unexpected error occurred", correlation_id.value, ).model_dump(), ) from e ================================================ FILE: build_stream/api/jobs/schemas.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
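# ---------------------------------------------------------------------------
# Editor's sketch (not part of the original module): how the request schema
# defined below behaves under its field validators. Values are illustrative.
#
#     from api.jobs.schemas import CreateJobRequest
#
#     req = CreateJobRequest(client_id="  client-001  ", client_name=" example ")
#     assert req.client_id == "client-001"     # validator strips whitespace
#     assert req.client_name == "example"
#     CreateJobRequest(client_id="   ")         # raises: client_id cannot be empty
# ---------------------------------------------------------------------------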
"""Pydantic schemas for Jobs API requests and responses.""" from datetime import datetime from typing import Any, Dict, List, Optional from pydantic import BaseModel, Field, field_validator class CreateJobRequest(BaseModel): """Request payload for creating a job.""" client_id: str = Field( ..., min_length=1, max_length=255, description="Client identifier", ) client_name: Optional[str] = Field( default=None, min_length=1, max_length=255, description="Optional client name", ) metadata: Optional[Dict[str, Any]] = Field( default=None, description="Optional metadata describing the job", ) parameters: Optional[Dict[str, Any]] = Field( default=None, description="Additional parameters for job execution", ) model_config = {"populate_by_name": True} @field_validator("client_id") @classmethod def validate_client_id(cls, v: str) -> str: """Validate client_id.""" if not v.strip(): raise ValueError("client_id cannot be empty") return v.strip() @field_validator("client_name") @classmethod def validate_client_name(cls, v: Optional[str]) -> Optional[str]: """Validate client name when provided.""" if v is None: return None if not v.strip(): raise ValueError("client_name cannot be empty") return v.strip() class CreateStageResponse(BaseModel): """Response model for a stage entry in create job response.""" stage_name: str = Field(..., description="Stage identifier") stage_state: str = Field(..., description="Stage state") started_at: Optional[str] = Field(default=None, description="Start timestamp (ISO 8601)") ended_at: Optional[str] = Field(default=None, description="End timestamp (ISO 8601)") error_code: Optional[str] = Field(default=None, description="Error code if failed") error_summary: Optional[str] = Field(default=None, description="Error summary if failed") class GetStageResponse(BaseModel): """Response model for a stage entry in get job response.""" stage_name: str = Field(..., description="Stage identifier") stage_state: str = Field(..., description="Stage state") started_at: Optional[str] = Field(default=None, description="Start timestamp (ISO 8601)") ended_at: Optional[str] = Field(default=None, description="End timestamp (ISO 8601)") error_code: Optional[str] = Field(default=None, description="Error code if failed") error_summary: Optional[str] = Field(default=None, description="Error summary if failed") log_file_path: Optional[str] = Field(default=None, description="Ansible log file path on OIM host (NFS share)") class CreateJobResponse(BaseModel): """Response model for job creation.""" job_id: str = Field(..., description="Job identifier") correlation_id: str = Field(..., description="Correlation identifier") job_state: str = Field(..., description="Job state") created_at: str = Field(..., description="Creation timestamp (ISO 8601)") stages: List[CreateStageResponse] = Field(..., description="Job stages") class GetJobResponse(BaseModel): """Response model for retrieving a job.""" job_id: str = Field(..., description="Job identifier") correlation_id: str = Field(..., description="Correlation identifier") job_state: str = Field(..., description="Job state (PENDING, RUNNING, SUCCEEDED, FAILED, CLEANED)") created_at: str = Field(..., description="Creation timestamp (ISO 8601)") updated_at: Optional[str] = Field( default=None, description="Update timestamp (ISO 8601)" ) tombstone: Optional[bool] = Field(default=None, description="Tombstone flag") stages: List[GetStageResponse] = Field(..., description="Job stages (step breakdown)") # Additional fields for state change timestamps state_timestamps: 
Optional[Dict[str, str]] = Field( default=None, description="Timestamps for each state change" ) model_config = { "json_schema_extra": { "examples": [ { "job_id": "019bf590-1234-7890-abcd-ef1234567890", "correlation_id": "corr-123456", "job_state": "RUNNING", "created_at": "2026-02-21T10:30:00Z", "updated_at": "2026-02-21T10:35:00Z", "tombstone": False, "stages": [ { "stage_name": "parse-catalog", "stage_state": "COMPLETED", "started_at": "2026-02-21T10:31:00Z", "ended_at": "2026-02-21T10:32:30Z", "error_code": None, "error_summary": None }, { "stage_name": "create-local-repository", "stage_state": "IN_PROGRESS", "started_at": "2026-02-21T10:33:00Z", "ended_at": None, "error_code": None, "error_summary": None } ], "state_timestamps": { "CREATED": "2026-02-21T10:30:00Z", "IN_PROGRESS": "2026-02-21T10:31:00Z" } } ] } } class ErrorResponse(BaseModel): """Standard error response body.""" error: str = Field(..., description="Error code") message: str = Field(..., description="Error message") correlation_id: str = Field(..., description="Request correlation ID") timestamp: str = Field(..., description="Error timestamp (ISO 8601)") @classmethod def create(cls, error: str, message: str, correlation_id: str) -> "ErrorResponse": """Convenience constructor with current UTC timestamp.""" return cls( error=error, message=message, correlation_id=correlation_id, timestamp=datetime.utcnow().isoformat() + "Z", ) ================================================ FILE: build_stream/api/local_repo/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. from api.local_repo.routes import router __all__ = ["router"] ================================================ FILE: build_stream/api/local_repo/dependencies.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
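# ---------------------------------------------------------------------------
# Editor's sketch (not part of the original module): the provider below builds
# the use case differently for the "prod" environment, so tests typically swap
# it out with FastAPI's dependency_overrides. The `app` object and the fake
# use case are assumptions for illustration only.
#
#     from api.local_repo.dependencies import get_create_local_repo_use_case
#
#     app.dependency_overrides[get_create_local_repo_use_case] = (
#         lambda: fake_create_local_repo_use_case   # hypothetical test double
#     )
# ---------------------------------------------------------------------------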
"""FastAPI dependency providers for Local Repository API.""" from typing import Optional from fastapi import Depends, Header, HTTPException, status from sqlalchemy.orm import Session from api.dependencies import ( get_db_session, _create_sql_job_repo, _create_sql_stage_repo, _create_sql_audit_repo, _get_container, _ENV, verify_token, ) from core.jobs.value_objects import ClientId, CorrelationId from orchestrator.local_repo.use_cases import CreateLocalRepoUseCase def _get_container(): """Lazy import of container to avoid circular imports.""" from container import container # pylint: disable=import-outside-toplevel return container def get_create_local_repo_use_case( db_session: Session = Depends(get_db_session), ) -> CreateLocalRepoUseCase: """Provide create local repo use case with shared session in prod.""" if _ENV == "prod": container = _get_container() return CreateLocalRepoUseCase( job_repo=_create_sql_job_repo(db_session), stage_repo=_create_sql_stage_repo(db_session), audit_repo=_create_sql_audit_repo(db_session), input_file_service=container.input_file_service(), playbook_queue_service=container.playbook_queue_request_service(), uuid_generator=container.uuid_generator(), ) return _get_container().create_local_repo_use_case() def get_local_repo_correlation_id( x_correlation_id: Optional[str] = Header( default=None, alias="X-Correlation-Id", description="Request tracing ID", ), ) -> CorrelationId: """Return provided correlation ID or generate one.""" generator = _get_container().uuid_generator() if x_correlation_id: try: return CorrelationId(x_correlation_id) except ValueError: pass generated_id = generator.generate() return CorrelationId(str(generated_id)) ================================================ FILE: build_stream/api/local_repo/routes.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
"""FastAPI routes for local repository stage operations.""" from datetime import datetime, timezone from typing import Annotated from fastapi import APIRouter, Depends, HTTPException, status from api.dependencies import verify_token, require_job_write from api.local_repo.dependencies import ( get_create_local_repo_use_case, get_local_repo_correlation_id, ) from api.local_repo.schemas import CreateLocalRepoResponse, LocalRepoErrorResponse from api.logging_utils import log_secure_info from core.jobs.exceptions import ( InvalidStateTransitionError, JobNotFoundError, TerminalStateViolationError, UpstreamStageNotCompletedError, ) from core.jobs.value_objects import ClientId, CorrelationId, JobId from core.localrepo.exceptions import ( InputDirectoryInvalidError, InputFilesMissingError, LocalRepoDomainError, QueueUnavailableError, ) from orchestrator.local_repo.commands import CreateLocalRepoCommand from orchestrator.local_repo.use_cases import CreateLocalRepoUseCase router = APIRouter(prefix="/jobs", tags=["Local Repository"]) def _build_error_response( error_code: str, message: str, correlation_id: str, ) -> LocalRepoErrorResponse: return LocalRepoErrorResponse( error=error_code, message=message, correlation_id=correlation_id, timestamp=datetime.now(timezone.utc).isoformat() + "Z", ) @router.post( "/{job_id}/stages/create-local-repository", response_model=CreateLocalRepoResponse, status_code=status.HTTP_202_ACCEPTED, summary="Create local repository", description="Trigger the create-local-repository stage for a job", responses={ 202: {"description": "Stage accepted", "model": CreateLocalRepoResponse}, 400: {"description": "Invalid request", "model": LocalRepoErrorResponse}, 401: {"description": "Unauthorized", "model": LocalRepoErrorResponse}, 403: {"description": "Forbidden - insufficient scope", "model": LocalRepoErrorResponse}, 404: {"description": "Job not found", "model": LocalRepoErrorResponse}, 409: {"description": "Stage conflict", "model": LocalRepoErrorResponse}, 500: {"description": "Internal error", "model": LocalRepoErrorResponse}, }, ) def create_local_repository( job_id: str, token_data: Annotated[dict, Depends(verify_token)] = None, # pylint: disable=unused-argument use_case: CreateLocalRepoUseCase = Depends(get_create_local_repo_use_case), correlation_id: CorrelationId = Depends(get_local_repo_correlation_id), _: None = Depends(require_job_write), ) -> CreateLocalRepoResponse: """Trigger the create-local-repository stage for a job. Accepts the request synchronously and returns 202 Accepted. The playbook execution is handled by the NFS queue watcher service. 
""" # Extract client_id from validated token data client_id = ClientId(token_data["client_id"]) log_secure_info( "info", f"Create local repo request: job_id={job_id}, correlation_id={correlation_id.value}", identifier=str(client_id.value), job_id=job_id, ) try: validated_job_id = JobId(job_id) except ValueError as exc: raise HTTPException( status_code=status.HTTP_400_BAD_REQUEST, detail=_build_error_response( "INVALID_JOB_ID", f"Invalid job_id format: {job_id}", correlation_id.value, ).model_dump(), ) from exc try: command = CreateLocalRepoCommand( job_id=validated_job_id, client_id=client_id, correlation_id=correlation_id, ) log_secure_info( "debug", f"Local repo executing: job_id={job_id}, client_id={client_id.value}, " f"correlation_id={correlation_id.value}", job_id=job_id, ) result = use_case.execute(command) log_secure_info( "info", f"Local repo success: job_id={job_id}, " f"stage={result.stage_name}, stage_status={result.status}, status=202", job_id=job_id, end_section=True, ) return CreateLocalRepoResponse( job_id=result.job_id, stage=result.stage_name, status=result.status, submitted_at=result.submitted_at, correlation_id=result.correlation_id, ) except JobNotFoundError as exc: log_secure_info("warning", f"Local repo failed: job_id={job_id}, reason=job_not_found, status=404", job_id=job_id, end_section=True) raise HTTPException( status_code=status.HTTP_404_NOT_FOUND, detail=_build_error_response( "JOB_NOT_FOUND", exc.message, correlation_id.value, ).model_dump(), ) from exc except UpstreamStageNotCompletedError as exc: log_secure_info( "warning", f"Local repo failed: job_id={job_id}, reason=upstream_stage_not_completed, status=412", job_id=job_id, end_section=True, ) raise HTTPException( status_code=status.HTTP_412_PRECONDITION_FAILED, detail=_build_error_response( "UPSTREAM_STAGE_NOT_COMPLETED", exc.message, correlation_id.value, ).model_dump(), ) from exc except InvalidStateTransitionError as exc: log_secure_info( "warning", f"Local repo failed: job_id={job_id}, reason=invalid_state_transition, status=409", job_id=job_id, end_section=True, ) raise HTTPException( status_code=status.HTTP_409_CONFLICT, detail=_build_error_response( "INVALID_STATE_TRANSITION", exc.message, correlation_id.value, ).model_dump(), ) from exc except TerminalStateViolationError as exc: log_secure_info( "warning", f"Local repo failed: job_id={job_id}, reason=terminal_state, status=412", job_id=job_id, end_section=True, ) if exc.state == "FAILED": message = f"Job {job_id} stage is in {exc.state} state and cannot be retried. Please create a new job to proceed." else: message = f"Job {job_id} stage is in {exc.state} state and cannot be modified." 
raise HTTPException( status_code=status.HTTP_412_PRECONDITION_FAILED, detail=_build_error_response( "TERMINAL_STATE_VIOLATION", message, correlation_id.value, ).model_dump(), ) from exc except InputFilesMissingError as exc: log_secure_info( "warning", f"Local repo failed: job_id={job_id}, reason=input_files_missing, status=400", job_id=job_id, end_section=True, ) raise HTTPException( status_code=status.HTTP_400_BAD_REQUEST, detail=_build_error_response( "INPUT_FILES_MISSING", exc.message, correlation_id.value, ).model_dump(), ) from exc except InputDirectoryInvalidError as exc: log_secure_info( "warning", f"Local repo failed: job_id={job_id}, reason=input_directory_invalid, status=400", job_id=job_id, end_section=True, ) raise HTTPException( status_code=status.HTTP_400_BAD_REQUEST, detail=_build_error_response( "INPUT_DIRECTORY_INVALID", exc.message, correlation_id.value, ).model_dump(), ) from exc except QueueUnavailableError as exc: log_secure_info( "error", f"Local repo failed: job_id={job_id}, reason=queue_unavailable, status=503", job_id=job_id, end_section=True, ) raise HTTPException( status_code=status.HTTP_503_SERVICE_UNAVAILABLE, detail=_build_error_response( "QUEUE_UNAVAILABLE", exc.message, correlation_id.value, ).model_dump(), ) from exc except LocalRepoDomainError as exc: log_secure_info( "error", f"Local repo failed: job_id={job_id}, reason=domain_error, status=500", job_id=job_id, end_section=True, ) raise HTTPException( status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail=_build_error_response( "LOCAL_REPO_ERROR", exc.message, correlation_id.value, ).model_dump(), ) from exc except Exception as exc: log_secure_info( "error", f"Local repo failed: job_id={job_id}, reason=unexpected_error, status=500", job_id=job_id, exc_info=True, end_section=True, ) raise HTTPException( status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail=_build_error_response( "INTERNAL_ERROR", "An unexpected error occurred", correlation_id.value, ).model_dump(), ) from exc ================================================ FILE: build_stream/api/local_repo/schemas.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
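# ---------------------------------------------------------------------------
# Editor's sketch (not part of the original module): example serialized bodies
# for the response models defined below. All field values are illustrative
# only; the field names match CreateLocalRepoResponse and LocalRepoErrorResponse.
#
#   202 Accepted:
#     {"job_id": "019bf590-...", "stage": "create-local-repository",
#      "status": "accepted", "submitted_at": "2026-02-21T10:33:00Z",
#      "correlation_id": "corr-123456"}
#
#   Error (e.g. 404):
#     {"error": "JOB_NOT_FOUND", "message": "Job not found: 019bf590-...",
#      "correlation_id": "corr-123456", "timestamp": "2026-02-21T10:33:01Z"}
# ---------------------------------------------------------------------------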
"""Pydantic schemas for Local Repository API requests and responses.""" from pydantic import BaseModel, Field class CreateLocalRepoResponse(BaseModel): """Response model for local repository stage acceptance (202 Accepted).""" job_id: str = Field(..., description="Job identifier") stage: str = Field(..., description="Stage identifier") status: str = Field(..., description="Acceptance status") submitted_at: str = Field(..., description="Submission timestamp (ISO 8601)") correlation_id: str = Field(..., description="Correlation identifier") class LocalRepoErrorResponse(BaseModel): """Standard error response body for local repository operations.""" error: str = Field(..., description="Error code") message: str = Field(..., description="Error message") correlation_id: str = Field(..., description="Request correlation ID") timestamp: str = Field(..., description="Error timestamp (ISO 8601)") ================================================ FILE: build_stream/api/logging_utils.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Secure logging utilities for Build Stream API. Provides per-job file logging with automatic redaction of sensitive data (IP addresses, JWT tokens, passwords, API keys, emails) so that job log files never contain exploitable information. """ import logging import re import traceback from pathlib import Path from typing import Dict, Optional _LOG_FORMATTER = logging.Formatter( "%(asctime)s - %(name)s - %(levelname)s - %(message)s" ) _LOG_BASE = Path("/opt/omnia/log/build_stream") _job_loggers: Dict[str, logging.Logger] = {} # --------------------------------------------------------------------------- # Sensitive-data redaction patterns # --------------------------------------------------------------------------- _SENSITIVE_PATTERNS = [ # IPv4 addresses (e.g. 
192.168.1.100) (re.compile(r"\b(?:\d{1,3}\.){3}\d{1,3}\b"), ""), # IPv6 addresses (simplified – colon-hex groups) (re.compile(r"\b(?:[0-9a-fA-F]{1,4}:){2,7}[0-9a-fA-F]{1,4}\b"), ""), # JWT / Bearer tokens (three base64url segments separated by dots) (re.compile(r"eyJ[A-Za-z0-9_-]+\.[A-Za-z0-9_-]+\.[A-Za-z0-9_-]+"), ""), # Authorization header values (re.compile(r"(?i)(bearer\s+)[A-Za-z0-9_\-\.]+"), r"\1"), # password= or passwd= or secret= or api_key= or token= values (re.compile( r"(?i)((?:password|passwd|secret|api_key|apikey|token|auth_token)" r"\s*[=:]\s*)[^\s,;\"']+" ), r"\1"), # Email addresses (re.compile(r"\b[A-Za-z0-9._%+-]+@[A-Za-z0-9.-]+\.[A-Z|a-z]{2,}\b"), ""), ] def _sanitize_message(message: str) -> str: """Redact sensitive data from a log message.""" for pattern, replacement in _SENSITIVE_PATTERNS: message = pattern.sub(replacement, message) return message # --------------------------------------------------------------------------- # Job log-file lifecycle # --------------------------------------------------------------------------- def create_job_log_file(job_id: str) -> Optional[Path]: """Create ``//.log`` and warm the cached logger. Called once from the create-job API. Subsequent calls to :func:`log_secure_info` with the same *job_id* will append to this file. Returns: Path to the created log file, or ``None`` on failure. """ job_log_dir = _LOG_BASE / job_id try: job_log_dir.mkdir(parents=True, exist_ok=True) log_file = job_log_dir / f"{job_id}.log" log_file.touch(exist_ok=True) _get_or_create_job_logger(job_id, log_file) return log_file except OSError: logging.getLogger(__name__).warning( "Failed to create job log directory/file for job: %s", job_id ) return None def remove_job_logger(job_id: str) -> None: """Flush, close, and remove the cached logger for *job_id*.""" job_logger = _job_loggers.pop(job_id, None) if job_logger is None: return for handler in list(job_logger.handlers): handler.flush() handler.close() job_logger.removeHandler(handler) # --------------------------------------------------------------------------- # Internal helpers # --------------------------------------------------------------------------- def _get_job_log_file(job_id: str) -> Optional[Path]: """Return the Path to the job log file if the directory exists.""" log_file = _LOG_BASE / job_id / f"{job_id}.log" if log_file.parent.is_dir(): return log_file return None def _get_or_create_job_logger( job_id: str, log_file: Optional[Path] = None ) -> Optional[logging.Logger]: """Return a cached per-job logger, creating one if necessary.""" if job_id in _job_loggers: return _job_loggers[job_id] if log_file is None: log_file = _get_job_log_file(job_id) if log_file is None: return None try: job_logger = logging.getLogger(f"build_stream.job.{job_id}") job_logger.setLevel(logging.DEBUG) job_logger.propagate = False handler = logging.FileHandler(str(log_file), mode="a") handler.setLevel(logging.DEBUG) handler.setFormatter(_LOG_FORMATTER) job_logger.addHandler(handler) _job_loggers[job_id] = job_logger return job_logger except OSError: return None # --------------------------------------------------------------------------- # Auth log file (singleton) # --------------------------------------------------------------------------- _auth_logger: Optional[logging.Logger] = None def _get_or_create_auth_logger() -> Optional[logging.Logger]: """Return the cached auth logger, creating it on first call. Writes to ``/auth.log``. 
""" global _auth_logger # pylint: disable=global-statement if _auth_logger is not None: return _auth_logger try: _LOG_BASE.mkdir(parents=True, exist_ok=True) log_file = _LOG_BASE / "auth.log" log_file.touch(exist_ok=True) auth_logger = logging.getLogger("build_stream.auth") auth_logger.setLevel(logging.DEBUG) auth_logger.propagate = False handler = logging.FileHandler(str(log_file), mode="a") handler.setLevel(logging.DEBUG) handler.setFormatter(_LOG_FORMATTER) auth_logger.addHandler(handler) _auth_logger = auth_logger return _auth_logger except OSError: logging.getLogger(__name__).warning("Failed to create auth log file") return None _SEPARATOR = "-" * 80 def log_auth_info( level: str, message: str, exc_info: bool = False, end_section: bool = False, ) -> None: """Log an auth/register event to ``/auth.log``. Sensitive data is automatically redacted before writing. Args: level: ``'info'``, ``'warning'``, ``'error'``, ``'debug'``, or ``'critical'``. message: Human-readable log message. exc_info: Append the current exception traceback. end_section: Append a separator line to visually delimit this execution. """ logger = logging.getLogger(__name__) log_message = message if exc_info: log_message = f"{log_message}\n{traceback.format_exc().rstrip()}" log_message = _sanitize_message(log_message) log_func = getattr(logger, level, logger.info) log_func(log_message) auth_logger = _get_or_create_auth_logger() if auth_logger: auth_log_func = getattr(auth_logger, level, auth_logger.info) auth_log_func(log_message) if end_section: auth_logger.info(_SEPARATOR) # --------------------------------------------------------------------------- # Public logging entry point (per-job) # --------------------------------------------------------------------------- def log_secure_info( level: str, message: str, identifier: Optional[str] = None, job_id: Optional[str] = None, exc_info: bool = False, end_section: bool = False, ) -> None: """Log a message after redacting sensitive data. * *identifier* is truncated to its first 8 characters. * IP addresses, JWT tokens, passwords, API keys, and emails are automatically replaced with ```` placeholders. * When *job_id* is supplied the entry is also written to the per-job log file. Args: level: ``'info'``, ``'warning'``, ``'error'``, ``'debug'``, or ``'critical'``. message: Human-readable log message. identifier: Optional opaque id — only the first 8 chars are kept. job_id: Route the entry to the job-specific log file. exc_info: Append the current exception traceback. end_section: Append a separator line to visually delimit this execution. """ logger = logging.getLogger(__name__) if identifier: log_message = f"{message}: {identifier[:8]}..." else: log_message = message if exc_info: log_message = f"{log_message}\n{traceback.format_exc().rstrip()}" log_message = _sanitize_message(log_message) log_func = getattr(logger, level, logger.info) log_func(log_message) if job_id: job_logger = _get_or_create_job_logger(job_id) if job_logger: job_log_func = getattr(job_logger, level, job_logger.info) job_log_func(log_message) if end_section: job_logger.info(_SEPARATOR) ================================================ FILE: build_stream/api/parse_catalog/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. 
# You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """ParseCatalog API module.""" from api.parse_catalog.routes import router __all__ = ["router"] ================================================ FILE: build_stream/api/parse_catalog/dependencies.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """FastAPI dependency providers for ParseCatalog API. This module provides parse-catalog-specific dependencies like the parse catalog use case provider. """ from fastapi import Depends from sqlalchemy.orm import Session from api.dependencies import ( get_db_session, _create_sql_job_repo, _create_sql_stage_repo, _create_sql_audit_repo, _get_container, _ENV, ) from orchestrator.catalog.use_cases import ParseCatalogUseCase # ------------------------------------------------------------------ # Parse-catalog-specific dependency providers # ------------------------------------------------------------------ def get_parse_catalog_use_case( db_session: Session = Depends(get_db_session), ) -> ParseCatalogUseCase: """Provide parse-catalog use case with shared session in prod.""" if _ENV == "prod": from infra.db.repositories import SqlArtifactMetadataRepository container = _get_container() return ParseCatalogUseCase( job_repo=_create_sql_job_repo(db_session), stage_repo=_create_sql_stage_repo(db_session), audit_repo=_create_sql_audit_repo(db_session), artifact_store=container.artifact_store(), artifact_metadata_repo=SqlArtifactMetadataRepository(db_session), uuid_generator=container.uuid_generator(), ) return _get_container().parse_catalog_use_case() ================================================ FILE: build_stream/api/parse_catalog/routes.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
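# ---------------------------------------------------------------------------
# Illustrative client call (editor's sketch, not part of the original module):
# uploading a catalog file to the parse-catalog stage defined below. The base
# URL and token are assumptions; the path and the multipart field name "file"
# come from this module.
#
#     import httpx
#
#     job_id = "<job-id from create-job>"
#     with open("catalog.json", "rb") as fh:
#         resp = httpx.post(
#             f"http://localhost:8000/jobs/{job_id}/stages/parse-catalog",
#             headers={"Authorization": "Bearer <access-token>"},
#             files={"file": ("catalog.json", fh, "application/json")},
#         )
#     resp.raise_for_status()   # 200 with {"status": "success", "message": "..."}
# ---------------------------------------------------------------------------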
"""FastAPI routes for ParseCatalog API.""" from typing import Annotated from fastapi import APIRouter, Depends, File, HTTPException, UploadFile, status from api.dependencies import require_catalog_read, verify_token, mark_stage_as_failed, get_db_session from api.parse_catalog.dependencies import get_parse_catalog_use_case from api.parse_catalog.schemas import ErrorResponse, ParseCatalogResponse, ParseCatalogStatus from api.parse_catalog.service import ( InvalidFileFormatError, InvalidJSONError, ParseCatalogService, ) from core.catalog.exceptions import ( CatalogParseError, ) from api.logging_utils import log_secure_info from core.jobs.exceptions import ( InvalidStateTransitionError, JobNotFoundError, StageAlreadyCompletedError, TerminalStateViolationError, ) router = APIRouter(prefix="/jobs", tags=["Catalog Parsing"]) @router.post( "/{job_id}/stages/parse-catalog", response_model=ParseCatalogResponse, status_code=status.HTTP_200_OK, summary="Parse a catalog file", description="Upload a catalog JSON file to parse and generate output files.", responses={ 200: { "description": "Catalog parsed successfully", "model": ParseCatalogResponse, }, 400: { "description": "Invalid request (bad file format or JSON)", "model": ErrorResponse, }, 401: { "description": "Unauthorized (missing or invalid token)", "model": ErrorResponse, }, 403: { "description": "Forbidden (insufficient scope)", "model": ErrorResponse, }, 422: { "description": "Validation error", "model": ErrorResponse, }, 500: { "description": "Internal server error during processing", "model": ErrorResponse, }, }, ) async def parse_catalog( job_id: str, file: UploadFile = File(..., description="The catalog JSON file to parse"), token_data: Annotated[dict, Depends(verify_token)] = None, # pylint: disable=unused-argument scope_data: Annotated[dict, Depends(require_catalog_read)] = None, # pylint: disable=unused-argument parse_catalog_use_case = Depends(get_parse_catalog_use_case), db_session = Depends(get_db_session), ) -> ParseCatalogResponse: """Parse a catalog from an uploaded JSON file. This endpoint accepts a catalog JSON file, validates its format and content, then processes it to generate the required output files. Requires a valid JWT token and 'catalog:read' scope. Args: job_id: The job identifier for the parsing operation. file: The uploaded JSON file containing catalog data. token_data: Validated token data from JWT (injected by dependency). scope_data: Token data with validated scope (injected by dependency). Returns: ParseCatalogResponse with status and message. Raises: HTTPException: With appropriate status code on failure. 
""" try: contents = await file.read() log_secure_info( "info", f"Parse-catalog request: job_id={job_id}, " f"filename={file.filename}, size_bytes={len(contents)}", job_id=job_id, ) # Create service with injected use case service = ParseCatalogService(parse_catalog_use_case=parse_catalog_use_case) result = await service.parse_catalog( filename=file.filename or "unknown.json", contents=contents, job_id=job_id, # Pass job_id to service ) log_secure_info( "info", f"Parse-catalog success: job_id={job_id}, status=200", job_id=job_id, end_section=True, ) response_data = { "status": ParseCatalogStatus.SUCCESS.value, "message": result.message, } return response_data except ValueError as e: # Handle job_id format validation errors error_msg = str(e) if "Invalid UUID format" in error_msg or "Invalid job_id format" in error_msg: log_secure_info("warning", f"Parse-catalog failed: job_id={job_id}, reason=invalid_job_id, status=400", job_id=job_id, end_section=True) raise HTTPException( status_code=status.HTTP_400_BAD_REQUEST, detail={ "error_code": "VALIDATION_ERROR", "message": f"Invalid job_id format: {job_id}", "correlation_id": "test-correlation-id" }, ) from e # Re-raise other ValueError as internal error log_secure_info("error", f"Parse-catalog failed: job_id={job_id}, reason=unexpected_value_error, status=500", job_id=job_id, exc_info=True, end_section=True) raise HTTPException( status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail={ "error_code": "INTERNAL_ERROR", "message": "An unexpected error occurred", "correlation_id": "test-correlation-id" }, ) from e except JobNotFoundError as e: log_secure_info("warning", f"Parse-catalog failed: job_id={job_id}, reason=job_not_found, status=404", job_id=job_id, end_section=True) raise HTTPException( status_code=status.HTTP_404_NOT_FOUND, detail={ "error_code": "JOB_NOT_FOUND", "message": f"Job not found: {job_id}", "correlation_id": "test-correlation-id" }, ) from e except TerminalStateViolationError as e: log_secure_info("warning", f"Parse-catalog failed: job_id={job_id}, reason=terminal_state, status=412", job_id=job_id, end_section=True) raise HTTPException( status_code=status.HTTP_412_PRECONDITION_FAILED, detail={ "error_code": "PRECONDITION_FAILED", "message": f"Job is in terminal state: {job_id}", "correlation_id": "test-correlation-id" }, ) from e except StageAlreadyCompletedError as e: log_secure_info("warning", f"Parse-catalog failed: job_id={job_id}, reason=stage_already_completed, status=409", job_id=job_id, end_section=True) raise HTTPException( status_code=status.HTTP_409_CONFLICT, detail={ "error_code": "STAGE_ALREADY_COMPLETED", "message": f"Parse catalog stage already completed for job: {job_id}", "correlation_id": "test-correlation-id" }, ) from e except InvalidStateTransitionError as e: log_secure_info("warning", f"Parse-catalog failed: job_id={job_id}, reason=invalid_state_transition, status=409", job_id=job_id, end_section=True) raise HTTPException( status_code=status.HTTP_409_CONFLICT, detail={ "error_code": "INVALID_STATE_TRANSITION", "message": str(e), "correlation_id": "test-correlation-id" }, ) from e except InvalidFileFormatError as e: log_secure_info("warning", f"Parse-catalog failed: job_id={job_id}, reason=invalid_file_format, status=400", job_id=job_id, end_section=True) # Mark stage as failed since validation failed at API layer mark_stage_as_failed(job_id, "parse-catalog", "INVALID_FILE_FORMAT", str(e), db_session) raise HTTPException( status_code=status.HTTP_400_BAD_REQUEST, detail={ "error_code": 
"INVALID_FILE_FORMAT", "message": str(e), "correlation_id": "test-correlation-id" }, ) from e except InvalidJSONError as e: log_secure_info("warning", f"Parse-catalog failed: job_id={job_id}, reason=invalid_json, status=400", job_id=job_id, end_section=True) # Mark stage as failed since validation failed at API layer mark_stage_as_failed(job_id, "parse-catalog", "INVALID_JSON", str(e), db_session) raise HTTPException( status_code=status.HTTP_400_BAD_REQUEST, detail={ "error_code": "INVALID_JSON", "message": str(e), "correlation_id": "test-correlation-id" }, ) from e except CatalogParseError as e: log_secure_info("error", f"Parse-catalog failed: job_id={job_id}, reason=catalog_parse_error, status=500", job_id=job_id, end_section=True) raise HTTPException( status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail={ "error_code": "CATALOG_PARSE_ERROR", "message": str(e), "correlation_id": "test-correlation-id" }, ) from e except Exception as e: log_secure_info("error", f"Parse-catalog failed: job_id={job_id}, reason=unexpected_error, status=500", job_id=job_id, exc_info=True, end_section=True) raise HTTPException( status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail={ "error_code": "INTERNAL_ERROR", "message": "An unexpected error occurred", "correlation_id": "test-correlation-id" }, ) from e ================================================ FILE: build_stream/api/parse_catalog/schemas.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Pydantic schemas for ParseCatalog API request and response models.""" from enum import Enum from typing import Optional from pydantic import BaseModel, Field class ParseCatalogStatus(str, Enum): """Status enum for ParseCatalog API responses.""" SUCCESS = "success" ERROR = "error" class ParseCatalogResponse(BaseModel): # pylint: disable=too-few-public-methods """Response model for ParseCatalog API.""" status: ParseCatalogStatus = Field( ..., description="Status of the catalog parsing operation", ) message: str = Field( ..., description="Human-readable message describing the result", ) model_config = { "json_schema_extra": { "examples": [ { "status": "success", "message": "Catalog parsed successfully", }, { "status": "error", "message": "Invalid file format. Only JSON files are accepted.", }, ] } } class ErrorResponse(BaseModel): # pylint: disable=too-few-public-methods """Standard error response model.""" status: ParseCatalogStatus = ParseCatalogStatus.ERROR message: str = Field(..., description="Error message describing what went wrong") detail: Optional[str] = Field( default=None, description="Additional error details (only in non-production environments)", ) ================================================ FILE: build_stream/api/parse_catalog/service.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. 
# # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Business logic service for ParseCatalog API.""" import json import logging import os import tempfile from dataclasses import dataclass from pathlib import Path from typing import Optional from core.catalog.generator import generate_root_json_from_catalog from common.config import load_config from core.jobs.value_objects import CorrelationId, JobId from infra.id_generator import UUIDv4Generator from orchestrator.catalog.commands.parse_catalog import ParseCatalogCommand logger = logging.getLogger(__name__) class CatalogParseError(Exception): """Exception raised when catalog parsing fails.""" class InvalidFileFormatError(CatalogParseError): """Exception raised when the uploaded file has an invalid format.""" class InvalidJSONError(CatalogParseError): """Exception raised when the JSON content is invalid.""" @dataclass class ParseResult: """Result of a catalog parse operation.""" success: bool message: str class ParseCatalogService: # pylint: disable=too-few-public-methods """Service for parsing catalog files.""" def __init__(self, parse_catalog_use_case=None, output_root: Optional[str] = None): """Initialize the ParseCatalog service. Args: parse_catalog_use_case: The use case for parsing catalogs (injected). output_root: Root directory for generated output files. If None, uses working_dir from config. """ self.parse_catalog_use_case = parse_catalog_use_case if output_root is None: try: config = load_config() working_dir = Path(config.artifact_store.working_dir) working_dir.mkdir(parents=True, exist_ok=True) self.output_root = str(working_dir / "tmp" / "generator") except (FileNotFoundError, ValueError): self.output_root = "/tmp/build_stream/tmp/generator" else: self.output_root = output_root Path(self.output_root).mkdir(parents=True, exist_ok=True) async def parse_catalog( self, filename: str, contents: bytes, job_id: str, ) -> ParseResult: """Parse a catalog from uploaded file contents. Args: filename: Name of the uploaded file. contents: Raw bytes content of the uploaded file. job_id: The job identifier for the orchestrator. Returns: ParseResult containing the operation status and details. Raises: InvalidFileFormatError: If file is not a JSON file. InvalidJSONError: If JSON content is malformed or not a dict. CatalogParseError: If catalog processing fails. 
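        Example:
            Illustrative usage, assuming an async caller and a use case wired
            by the application container; file name, payload, and job id below
            are placeholders:

                service = ParseCatalogService(parse_catalog_use_case=use_case)
                result = await service.parse_catalog(
                    filename="catalog.json",
                    contents=b"{}",  # any JSON object passes structural validation
                    job_id="3fa85f64-5717-4562-b3fc-2c963f66afa6",
                )
                print(result.success, result.message)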
""" logger.info("Starting catalog parse for file: %s", filename) # Note: Job validation is handled by the orchestrator use case self._validate_file_format(filename) json_data = self._parse_json_content(contents) self._validate_json_structure(json_data) return await self._process_catalog_via_orchestrator(json_data, job_id) async def _process_catalog_via_orchestrator(self, json_data: dict, job_id: str) -> ParseResult: """Process catalog using the orchestrator use case.""" # Create command for orchestrator uuid_gen = UUIDv4Generator() # Convert json_data back to bytes as expected by orchestrator json_bytes = json.dumps(json_data).encode('utf-8') command = ParseCatalogCommand( job_id=JobId(job_id), correlation_id=CorrelationId(str(uuid_gen.generate())), filename="uploaded.json", content=json_bytes, ) # Execute via orchestrator use case (injected, not from container) if self.parse_catalog_use_case is None: # Fallback to container if not injected (for backward compatibility) from container import container # pylint: disable=import-outside-toplevel use_case = container.parse_catalog_use_case() else: use_case = self.parse_catalog_use_case result = use_case.execute(command) # Convert orchestrator result to API result return ParseResult( success=True, message=result.message, ) def _validate_file_format(self, filename: str) -> None: """Validate that the file has a .json extension.""" if not filename.endswith(".json"): logger.warning("Invalid file format received: %s", filename) raise InvalidFileFormatError( "Invalid file format. Only JSON files are accepted." ) def _parse_json_content(self, contents: bytes) -> dict: """Parse JSON content from bytes.""" try: return json.loads(contents.decode("utf-8")) except json.JSONDecodeError as e: logger.error("Failed to parse JSON content") raise InvalidJSONError(f"Invalid JSON data: {e.msg}") from e except UnicodeDecodeError as e: logger.error("Failed to decode file content as UTF-8") raise InvalidJSONError("File content is not valid UTF-8 text") from e def _validate_json_structure(self, json_data: object) -> None: """Validate that JSON data is a dictionary.""" if not isinstance(json_data, dict): logger.warning("JSON data is not a dictionary") raise InvalidJSONError( "Invalid JSON data. The data must be a dictionary." ) async def _process_catalog(self, json_data: dict) -> ParseResult: """Process the catalog data and generate output files. Args: json_data: Validated catalog data as a dictionary. Returns: ParseResult with success status and output path. Raises: CatalogParseError: If processing fails. """ temp_file_path = None try: temp_file_path = self._write_temp_file(json_data) logger.debug("Wrote catalog to temporary file: %s", temp_file_path) generate_root_json_from_catalog( catalog_path=temp_file_path, output_root=self.output_root, ) logger.info("Catalog parsed successfully, output at: %s", self.output_root) return ParseResult( success=True, message="Catalog parsed successfully", ) except FileNotFoundError as e: logger.error("Required file not found during processing") raise CatalogParseError("Required file not found during processing") from e except Exception as e: logger.error("Catalog processing failed") raise CatalogParseError("Failed to process catalog") from e finally: if temp_file_path and os.path.exists(temp_file_path): os.unlink(temp_file_path) logger.debug("Cleaned up temporary file: %s", temp_file_path) def _write_temp_file(self, json_data: dict) -> str: """Write JSON data to a temporary file. Args: json_data: Data to write to the file. 
Returns: Path to the temporary file. """ with tempfile.NamedTemporaryFile( mode="w", suffix=".json", delete=False, encoding="utf-8", ) as f: json.dump(json_data, f) return f.name ================================================ FILE: build_stream/api/router.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """API router that aggregates all API modules.""" from fastapi import APIRouter from api.auth.routes import router as auth_router from api.jobs.routes import router as jobs_router from api.parse_catalog.routes import router as parse_catalog_router from api.catalog_roles.routes import router as catalog_roles_router from api.generate_input_files.routes import router as generate_input_files_router from api.local_repo.routes import router as local_repo_router from api.build_image.routes import router as build_image_router from api.validate.routes import router as validate_router api_router = APIRouter(prefix="/api/v1") api_router.include_router(auth_router) api_router.include_router(jobs_router) api_router.include_router(parse_catalog_router) api_router.include_router(catalog_roles_router) api_router.include_router(generate_input_files_router) api_router.include_router(local_repo_router) api_router.include_router(build_image_router) api_router.include_router(validate_router) ================================================ FILE: build_stream/api/validate/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """ValidateImageOnTest API module.""" __all__ = [] ================================================ FILE: build_stream/api/validate/dependencies.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
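# Illustrative sketch of how the `api_router` assembled in api/router.py
# (above) is typically mounted on the FastAPI application; the module and
# variable names in this sketch are assumptions, not taken from the sources:
#
#     from fastapi import FastAPI
#     from api.router import api_router
#
#     app = FastAPI()
#     app.include_router(api_router)  # exposes every module under /api/v1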
"""FastAPI dependency providers for ValidateImageOnTest API.""" from typing import Optional from fastapi import Depends, Header from sqlalchemy.orm import Session from api.dependencies import ( get_db_session, _create_sql_job_repo, _create_sql_stage_repo, _create_sql_audit_repo, _get_container, _ENV, ) from core.jobs.value_objects import CorrelationId from orchestrator.validate.use_cases import ValidateImageOnTestUseCase def _get_container(): """Lazy import of container to avoid circular imports.""" from container import container # pylint: disable=import-outside-toplevel return container def get_validate_image_on_test_use_case( db_session: Session = Depends(get_db_session), ) -> ValidateImageOnTestUseCase: """Provide validate-image-on-test use case with shared session in prod.""" if _ENV == "prod": container = _get_container() return ValidateImageOnTestUseCase( job_repo=_create_sql_job_repo(db_session), stage_repo=_create_sql_stage_repo(db_session), audit_repo=_create_sql_audit_repo(db_session), queue_service=container.validate_queue_service(), uuid_generator=container.uuid_generator(), ) return _get_container().validate_image_on_test_use_case() def get_validate_correlation_id( x_correlation_id: Optional[str] = Header( default=None, alias="X-Correlation-Id", description="Request tracing ID", ), ) -> CorrelationId: """Return provided correlation ID or generate one.""" generator = _get_container().uuid_generator() if x_correlation_id: try: return CorrelationId(x_correlation_id) except ValueError: pass generated_id = generator.generate() return CorrelationId(str(generated_id)) ================================================ FILE: build_stream/api/validate/routes.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
"""FastAPI routes for validate-image-on-test stage operations.""" import logging from datetime import datetime, timezone from fastapi import APIRouter, Depends, HTTPException, status from api.validate.dependencies import ( get_validate_image_on_test_use_case, get_validate_correlation_id, ) from api.dependencies import verify_token, require_job_write from api.validate.schemas import ( ValidateImageOnTestRequest, ValidateImageOnTestResponse, ValidateImageOnTestErrorResponse, ) from api.logging_utils import log_secure_info from core.jobs.exceptions import ( InvalidStateTransitionError, JobNotFoundError, UpstreamStageNotCompletedError, ) from core.jobs.value_objects import ClientId, CorrelationId, JobId from core.validate.exceptions import ( StageGuardViolationError, ValidateDomainError, ValidationExecutionError, ) from orchestrator.validate.commands import ValidateImageOnTestCommand from orchestrator.validate.use_cases import ValidateImageOnTestUseCase logger = logging.getLogger(__name__) router = APIRouter(prefix="/jobs", tags=["Validate Image On Test"]) def _build_error_response( error_code: str, message: str, correlation_id: str, ) -> ValidateImageOnTestErrorResponse: return ValidateImageOnTestErrorResponse( error=error_code, message=message, correlation_id=correlation_id, timestamp=datetime.now(timezone.utc).isoformat() + "Z", ) @router.post( "/{job_id}/stages/validate-image-on-test", response_model=ValidateImageOnTestResponse, status_code=status.HTTP_202_ACCEPTED, summary="Validate image on test environment", description="Trigger the validate-image-on-test stage for a job", responses={ 202: {"description": "Stage accepted", "model": ValidateImageOnTestResponse}, 400: {"description": "Invalid request", "model": ValidateImageOnTestErrorResponse}, 401: {"description": "Unauthorized", "model": ValidateImageOnTestErrorResponse}, 404: {"description": "Job not found", "model": ValidateImageOnTestErrorResponse}, 409: {"description": "Stage conflict", "model": ValidateImageOnTestErrorResponse}, 412: {"description": "Stage guard violation", "model": ValidateImageOnTestErrorResponse}, 500: {"description": "Internal error", "model": ValidateImageOnTestErrorResponse}, }, ) def create_validate_image_on_test( job_id: str, request_body: ValidateImageOnTestRequest, token_data: dict = Depends(verify_token), use_case: ValidateImageOnTestUseCase = Depends(get_validate_image_on_test_use_case), correlation_id: CorrelationId = Depends(get_validate_correlation_id), _: None = Depends(require_job_write), ) -> ValidateImageOnTestResponse: """Trigger the validate-image-on-test stage for a job. Accepts the request synchronously and returns 202 Accepted. The playbook execution is handled by the NFS queue watcher service. 
""" # Extract client_id from token_data client_id = ClientId(token_data["client_id"]) logger.info( "Validate image on test request: job_id=%s, client_id=%s, correlation_id=%s, image_key=%s", job_id, client_id.value, correlation_id.value, request_body.image_key, ) try: validated_job_id = JobId(job_id) except ValueError as exc: raise HTTPException( status_code=status.HTTP_400_BAD_REQUEST, detail=_build_error_response( "INVALID_JOB_ID", f"Invalid job_id format: {job_id}", correlation_id.value, ).model_dump(), ) from exc try: command = ValidateImageOnTestCommand( job_id=validated_job_id, client_id=client_id, correlation_id=correlation_id, image_key=request_body.image_key, ) result = use_case.execute(command) return ValidateImageOnTestResponse( job_id=result.job_id, stage=result.stage_name, status=result.status, submitted_at=result.submitted_at, correlation_id=result.correlation_id, ) except JobNotFoundError as exc: logger.warning("Job not found: %s", job_id) raise HTTPException( status_code=status.HTTP_404_NOT_FOUND, detail=_build_error_response( "JOB_NOT_FOUND", exc.message, correlation_id.value, ).model_dump(), ) from exc except InvalidStateTransitionError as exc: log_secure_info( "warning", f"Invalid state transition for job {job_id}", str(correlation_id.value), ) raise HTTPException( status_code=status.HTTP_409_CONFLICT, detail=_build_error_response( "INVALID_STATE_TRANSITION", exc.message, correlation_id.value, ).model_dump(), ) from exc except UpstreamStageNotCompletedError as exc: log_secure_info( "warning", f"Validate failed: job_id={job_id}, reason=upstream_stage_not_completed, status=412", str(correlation_id.value), ) raise HTTPException( status_code=status.HTTP_412_PRECONDITION_FAILED, detail=_build_error_response( "UPSTREAM_STAGE_NOT_COMPLETED", exc.message, correlation_id.value, ).model_dump(), ) from exc except StageGuardViolationError as exc: log_secure_info( "warning", f"Stage guard violation for job {job_id}", str(correlation_id.value), ) raise HTTPException( status_code=status.HTTP_412_PRECONDITION_FAILED, detail=_build_error_response( "STAGE_GUARD_VIOLATION", exc.message, correlation_id.value, ).model_dump(), ) from exc except ValidationExecutionError as exc: log_secure_info( "error", f"Validation execution error for job {job_id}", str(correlation_id.value), ) raise HTTPException( status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail=_build_error_response( "VALIDATION_EXECUTION_ERROR", exc.message, correlation_id.value, ).model_dump(), ) from exc except ValidateDomainError as exc: log_secure_info( "error", f"Validate domain error for job {job_id}", str(correlation_id.value), ) raise HTTPException( status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail=_build_error_response( "VALIDATE_ERROR", exc.message, correlation_id.value, ).model_dump(), ) from exc except Exception as exc: logger.exception("Unexpected error creating validate-image-on-test stage") raise HTTPException( status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, detail=_build_error_response( "INTERNAL_ERROR", "An unexpected error occurred", correlation_id.value, ).model_dump(), ) from exc ================================================ FILE: build_stream/api/validate/schemas.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. 
# You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Pydantic schemas for ValidateImageOnTest API requests and responses.""" from pydantic import BaseModel, Field class ValidateImageOnTestRequest(BaseModel): """Request model for validate-image-on-test stage.""" image_key: str = Field(..., description="Image key to validate") class ValidateImageOnTestResponse(BaseModel): """Response model for validate-image-on-test stage acceptance (202 Accepted).""" job_id: str = Field(..., description="Job identifier") stage: str = Field(..., description="Stage identifier") status: str = Field(..., description="Acceptance status") submitted_at: str = Field(..., description="Submission timestamp (ISO 8601)") correlation_id: str = Field(..., description="Correlation identifier") class ValidateImageOnTestErrorResponse(BaseModel): """Standard error response body for validate-image-on-test operations.""" error: str = Field(..., description="Error code") message: str = Field(..., description="Error message") correlation_id: str = Field(..., description="Request correlation ID") timestamp: str = Field(..., description="Error timestamp (ISO 8601)") ================================================ FILE: build_stream/api/vault_client.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Ansible Vault client for secure credential storage and retrieval.""" import logging import os import subprocess import tempfile from typing import Any, Dict, Optional import yaml logger = logging.getLogger(__name__) class VaultError(Exception): """Base exception for vault operations.""" class VaultDecryptError(VaultError): """Exception raised when vault decryption fails.""" class VaultEncryptError(VaultError): """Exception raised when vault encryption fails.""" class VaultNotFoundError(VaultError): """Exception raised when vault file is not found.""" class VaultClient: # pylint: disable=too-few-public-methods """Client for interacting with Ansible Vault encrypted files.""" def __init__( self, vault_password_file: Optional[str] = None, oauth_clients_vault_path: Optional[str] = None, auth_config_vault_path: Optional[str] = None, ): """Initialize the Vault client. Args: vault_password_file: Path to the Ansible Vault password file. oauth_clients_vault_path: Path to the OAuth clients vault file. auth_config_vault_path: Path to the auth configuration vault file. 
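        Example:
            Illustrative construction; when arguments are omitted, the paths
            fall back to environment variables and the defaults shown in the
            initializer body below:

                client = VaultClient(
                    vault_password_file="/etc/omnia/.vault_pass",
                    oauth_clients_vault_path=(
                        "/etc/omnia/input/project_default/"
                        "build_stream_oauth_credentials.yml"
                    ),
                )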
""" self.vault_password_file = vault_password_file or os.getenv( "ANSIBLE_VAULT_PASSWORD_FILE", "/etc/omnia/.vault_pass" ) self.oauth_clients_vault_path = oauth_clients_vault_path or os.getenv( "OAUTH_CLIENTS_VAULT_PATH", "/etc/omnia/input/project_default/build_stream_oauth_credentials.yml" ) self.auth_config_vault_path = auth_config_vault_path or os.getenv( "AUTH_CONFIG_VAULT_PATH", "/etc/omnia/input/project_default/build_stream_oauth_credentials.yml" ) _ALLOWED_VAULT_COMMANDS = frozenset({"view", "encrypt", "decrypt"}) def _run_vault_command( self, command: str, vault_path: str, ) -> str: """Run an ansible-vault command. Args: command: The vault command (view, encrypt, decrypt). vault_path: Path to the vault file. Returns: Command output as string. Raises: VaultError: If command is not in allowlist. VaultNotFoundError: If vault file doesn't exist. VaultDecryptError: If decryption fails. VaultEncryptError: If encryption fails. """ if command not in self._ALLOWED_VAULT_COMMANDS: raise VaultError("Invalid vault command") if command == "view" and not os.path.exists(vault_path): raise VaultNotFoundError(f"Vault file not found: {vault_path}") if not os.path.exists(self.vault_password_file): raise VaultError(f"Vault password file not found: {self.vault_password_file}") cmd = [ "ansible-vault", command, vault_path, "--vault-password-file", self.vault_password_file, ] try: result = subprocess.run( cmd, capture_output=True, text=True, check=True, timeout=30, ) return result.stdout except subprocess.CalledProcessError: logger.error("Vault command failed: %s", command) if command == "view": raise VaultDecryptError("Failed to decrypt vault") from None raise VaultEncryptError("Failed to encrypt vault") from None except subprocess.TimeoutExpired: logger.error("Vault command timed out: %s", command) raise VaultError("Vault operation timed out") from None def read_vault(self, vault_path: str) -> Dict[str, Any]: """Read and decrypt a vault file. Args: vault_path: Path to the vault file. Returns: Decrypted vault contents as dictionary. Raises: VaultNotFoundError: If vault file doesn't exist. VaultDecryptError: If decryption fails. """ logger.debug("Reading vault: %s", vault_path) output = self._run_vault_command("view", vault_path) try: return yaml.safe_load(output) or {} except yaml.YAMLError: logger.error("Failed to parse vault YAML") raise VaultDecryptError("Invalid vault content format") from None def write_vault(self, vault_path: str, data: Dict[str, Any]) -> None: """Write data to an encrypted vault file. Args: vault_path: Path to the vault file. data: Data to encrypt and store. Raises: VaultEncryptError: If encryption fails. 
""" logger.debug("Writing vault: %s", vault_path) yaml_content = yaml.safe_dump(data, default_flow_style=False) vault_dir = os.path.dirname(vault_path) if vault_dir and not os.path.exists(vault_dir): os.makedirs(vault_dir, mode=0o700, exist_ok=True) with tempfile.NamedTemporaryFile( mode="w", suffix=".yml", delete=False, encoding="utf-8", ) as temp_file: temp_file.write(yaml_content) temp_file.flush() os.fsync(temp_file.fileno()) temp_path = temp_file.name try: logger.debug("Encrypting temp file: %s", temp_path) encrypt_cmd = [ "ansible-vault", "encrypt", temp_path, "--vault-password-file", self.vault_password_file, "--encrypt-vault-id", "default", ] subprocess.run( encrypt_cmd, check=True, capture_output=True, text=True, timeout=30, ) logger.debug("Encryption completed, reading encrypted content") with open(temp_path, "r", encoding="utf-8") as f: encrypted_content = f.read() with open(vault_path, "w", encoding="utf-8") as f: f.write(encrypted_content) os.chmod(vault_path, 0o600) logger.debug("Vault written successfully") except subprocess.CalledProcessError: raise VaultEncryptError("Failed to encrypt vault") from None except subprocess.TimeoutExpired: logger.error("Vault encryption timed out") raise VaultError("Vault operation timed out") from None finally: if os.path.exists(temp_path): os.unlink(temp_path) def get_auth_config(self) -> Dict[str, Any]: """Get authentication configuration from vault. Returns: Auth configuration dictionary containing registration credentials. Raises: VaultNotFoundError: If auth config vault doesn't exist. VaultDecryptError: If decryption fails. """ return self.read_vault(self.auth_config_vault_path) def get_oauth_clients(self) -> Dict[str, Any]: """Get OAuth clients from vault. Returns: Dictionary of registered OAuth clients. Raises: VaultNotFoundError: If OAuth clients vault doesn't exist. VaultDecryptError: If decryption fails. """ try: data = self.read_vault(self.oauth_clients_vault_path) return data.get("oauth_clients", {}) except VaultNotFoundError: return {} def save_oauth_client( self, client_id: str, client_data: Dict[str, Any], ) -> None: """Save a new OAuth client to vault. Args: client_id: The client identifier. client_data: Client data including hashed secret and metadata. Raises: VaultEncryptError: If encryption fails. """ try: existing_data = self.read_vault(self.oauth_clients_vault_path) except VaultNotFoundError: existing_data = {"oauth_clients": {}} if "oauth_clients" not in existing_data: existing_data["oauth_clients"] = {} existing_data["oauth_clients"][client_id] = client_data self.write_vault(self.oauth_clients_vault_path, existing_data) logger.info("OAuth client saved: %s", client_id[:8] + "...") def get_active_client_count(self) -> int: """Get the count of active registered clients. Returns: Number of active clients. """ clients = self.get_oauth_clients() return sum(1 for c in clients.values() if c.get("is_active", True)) def client_exists(self, client_name: str) -> bool: """Check if a client with the given name already exists. Args: client_name: The client name to check. Returns: True if client exists, False otherwise. 
""" clients = self.get_oauth_clients() for client_data in clients.values(): if client_data.get("client_name") == client_name: return True return False ================================================ FILE: build_stream/build_stream.ini ================================================ # BuildStream Configuration [paths] build_stream_base_path = /opt/omnia/build_stream_root [artifact_store] backend = file_store working_dir = /tmp/build_stream [file_store] base_path = /opt/omnia/build_stream_root/artifacts ================================================ FILE: build_stream/common/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. ================================================ FILE: build_stream/common/config.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Configuration loader for BuildStream.""" import os from dataclasses import dataclass from pathlib import Path from typing import Optional import configparser @dataclass class ArtifactStoreConfig: """Artifact store configuration.""" backend: str working_dir: str max_file_size_bytes: int max_archive_uncompressed_bytes: int max_archive_entries: int @dataclass class PathsConfig: """BuildStream paths configuration.""" build_stream_base_path: str @dataclass class FileStoreConfig: """File store configuration.""" base_path: str @dataclass class BuildStreamConfig: """BuildStream configuration.""" paths: PathsConfig artifact_store: ArtifactStoreConfig file_store: Optional[FileStoreConfig] def load_config(config_path: Optional[str] = None) -> BuildStreamConfig: """Load BuildStream configuration from INI file. Args: config_path: Path to configuration file. If None, uses BUILD_STREAM_CONFIG_PATH environment variable or default path. Returns: BuildStreamConfig instance. Raises: FileNotFoundError: If config file not found. ValueError: If config is invalid. 
""" if config_path is None: config_path = os.getenv( "BUILD_STREAM_CONFIG_PATH", "/opt/omnia/windsurf/build_stream_venu_oim/build_stream/build_stream.ini" ) config_file = Path(config_path) if not config_file.exists(): raise FileNotFoundError(f"Configuration file not found: {config_file}") parser = configparser.ConfigParser() parser.read(config_file) if not parser.sections(): raise ValueError(f"Empty configuration file: {config_file}") # Parse paths config paths_section = "paths" build_stream_base_path = parser.get(paths_section, "build_stream_base_path", fallback="/opt/omnia/build_stream_root") paths = PathsConfig( build_stream_base_path=build_stream_base_path, ) # Parse artifact_store config artifact_store_section = "artifact_store" backend = parser.get(artifact_store_section, "backend", fallback="file_store") # Parse optional size limits with defaults max_file_size_bytes = 5242880 # 5MB default max_archive_uncompressed_bytes = 52428800 # 50MB default max_archive_entries = 500 # default if parser.has_option(artifact_store_section, "max_file_size_bytes"): max_file_size_bytes = parser.getint(artifact_store_section, "max_file_size_bytes") if parser.has_option(artifact_store_section, "max_archive_uncompressed_bytes"): max_archive_uncompressed_bytes = parser.getint(artifact_store_section, "max_archive_uncompressed_bytes") if parser.has_option(artifact_store_section, "max_archive_entries"): max_archive_entries = parser.getint(artifact_store_section, "max_archive_entries") artifact_store = ArtifactStoreConfig( backend=backend, working_dir=parser.get(artifact_store_section, "working_dir", fallback="/tmp/build_stream"), max_file_size_bytes=max_file_size_bytes, max_archive_uncompressed_bytes=max_archive_uncompressed_bytes, max_archive_entries=max_archive_entries, ) # Parse file_store config only if backend is file_store file_store = None if backend == "file_store": if parser.has_section("file_store") and parser.has_option("file_store", "base_path"): file_store = FileStoreConfig( base_path=parser.get("file_store", "base_path") ) else: raise ValueError("file_store section with base_path is required when backend=file_store") return BuildStreamConfig( paths=paths, artifact_store=artifact_store, file_store=file_store, ) ================================================ FILE: build_stream/common/constants.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. ================================================ FILE: build_stream/common/logging.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. 
# You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. ================================================ FILE: build_stream/common/user_messages.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. ================================================ FILE: build_stream/container.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
"""Dependency Injector containers for the Build Stream API.""" # pylint: disable=c-extension-no-member import os from pathlib import Path from dependency_injector import containers, providers from infra.artifact_store.in_memory_artifact_store import InMemoryArtifactStore from infra.artifact_store.in_memory_artifact_metadata import ( InMemoryArtifactMetadataRepository, ) from infra.artifact_store.file_artifact_store import FileArtifactStore from infra.id_generator import JobUUIDGenerator, UUIDv4Generator from infra.repositories import ( InMemoryJobRepository, InMemoryStageRepository, InMemoryIdempotencyRepository, InMemoryAuditEventRepository, NfsInputRepository, NfsPlaybookQueueRequestRepository, NfsPlaybookQueueResultRepository, ) from infra.db.repositories import ( SqlJobRepository, SqlStageRepository, SqlIdempotencyRepository, SqlAuditEventRepository, SqlArtifactMetadataRepository, ) from infra.db.session import SessionLocal from orchestrator.catalog.use_cases.generate_input_files import GenerateInputFilesUseCase from orchestrator.catalog.use_cases.parse_catalog import ParseCatalogUseCase from orchestrator.jobs.use_cases import CreateJobUseCase from orchestrator.local_repo.use_cases import CreateLocalRepoUseCase from orchestrator.common.result_poller import ResultPoller from orchestrator.build_image.use_cases import CreateBuildImageUseCase from orchestrator.validate.use_cases import ValidateImageOnTestUseCase from core.localrepo.services import ( InputFileService, PlaybookQueueRequestService, PlaybookQueueResultService, ) from core.build_image.services import ( BuildImageConfigService, ) from core.validate.services import ValidateQueueService from core.catalog.adapter_policy import _DEFAULT_POLICY_PATH, _DEFAULT_SCHEMA_PATH from core.artifacts.value_objects import SafePath from common.config import load_config def _create_artifact_store(): """Factory function to create artifact store based on configuration. Returns: InMemoryArtifactStore or FileArtifactStore based on config. """ try: config = load_config() # Check backend setting if config.artifact_store.backend == "file_store" and config.file_store is not None: base_path = Path(config.file_store.base_path) return FileArtifactStore( base_path=base_path, max_artifact_size_bytes=config.artifact_store.max_file_size_bytes, ) if config.artifact_store.backend == "memory_store": return InMemoryArtifactStore( max_artifact_size_bytes=config.artifact_store.max_file_size_bytes, ) # Fall back to file store with default path return FileArtifactStore( base_path=Path("/opt/omnia/build_stream_root/artifacts"), max_artifact_size_bytes=config.artifact_store.max_file_size_bytes, ) except (FileNotFoundError, ValueError): # If config not found or invalid, use file store with defaults as fallback return FileArtifactStore( base_path=Path("/opt/omnia/build_stream_root/artifacts"), max_artifact_size_bytes=5242880, # 5MB default ) _RESOURCES_DIR = Path(__file__).resolve().parent / "core" / "catalog" / "resources" _DEFAULT_POLICY_PATH = _RESOURCES_DIR / "adapter_policy_default.json" _DEFAULT_SCHEMA_PATH = _RESOURCES_DIR / "AdapterPolicySchema.json" class DevContainer(containers.DeclarativeContainer): # pylint: disable=R0903 """Development profile container. Uses in-memory mock repositories for fast development and testing. No external dependencies (database, S3, etc.) required. Activated when ENV=dev. 
""" wiring_config = containers.WiringConfiguration( modules=[ "api.dependencies", "api.jobs.routes", "api.jobs.dependencies", "api.local_repo.routes", "api.local_repo.dependencies", "api.build_image.routes", "api.build_image.dependencies", "api.validate.routes", "api.validate.dependencies", "api.parse_catalog.routes", "api.parse_catalog.dependencies", ] ) job_id_generator = providers.Singleton(JobUUIDGenerator) uuid_generator = providers.Singleton(UUIDv4Generator) default_policy_path = providers.Singleton( SafePath, value=_DEFAULT_POLICY_PATH, ) policy_schema_path = providers.Singleton( SafePath, value=_DEFAULT_SCHEMA_PATH, ) # --- Jobs repositories --- job_repository = providers.Singleton(InMemoryJobRepository) stage_repository = providers.Singleton(InMemoryStageRepository) idempotency_repository = providers.Singleton(InMemoryIdempotencyRepository) audit_repository = providers.Singleton(InMemoryAuditEventRepository) # --- input repository --- input_repository = providers.Singleton( NfsInputRepository, ) # --- Queue repositories --- playbook_queue_request_repository = providers.Singleton( NfsPlaybookQueueRequestRepository, ) playbook_queue_result_repository = providers.Singleton( NfsPlaybookQueueResultRepository, ) # --- Local repo services --- input_file_service = providers.Factory( InputFileService, input_repo=input_repository, ) # --- Build image services --- build_image_config_service = providers.Factory( BuildImageConfigService, config_repo=input_repository, ) playbook_queue_request_service = providers.Factory( PlaybookQueueRequestService, request_repo=playbook_queue_request_repository, ) playbook_queue_result_service = providers.Factory( PlaybookQueueResultService, result_repo=playbook_queue_result_repository, ) # --- Validate services --- validate_queue_service = providers.Factory( ValidateQueueService, queue_repo=playbook_queue_request_repository, ) # --- Result poller --- result_poller = providers.Singleton( ResultPoller, result_service=playbook_queue_result_service, job_repo=job_repository, stage_repo=stage_repository, audit_repo=audit_repository, uuid_generator=uuid_generator, poll_interval=int(os.getenv("RESULT_POLL_INTERVAL", "5")), ) # --- Use cases --- artifact_store = providers.Singleton(_create_artifact_store) artifact_metadata_repository = providers.Singleton( InMemoryArtifactMetadataRepository, ) create_job_use_case = providers.Factory( CreateJobUseCase, job_repo=job_repository, stage_repo=stage_repository, idempotency_repo=idempotency_repository, audit_repo=audit_repository, job_id_generator=job_id_generator, uuid_generator=uuid_generator, ) create_local_repo_use_case = providers.Factory( CreateLocalRepoUseCase, job_repo=job_repository, stage_repo=stage_repository, audit_repo=audit_repository, input_file_service=input_file_service, playbook_queue_service=playbook_queue_request_service, uuid_generator=uuid_generator, ) parse_catalog_use_case = providers.Factory( ParseCatalogUseCase, job_repo=job_repository, stage_repo=stage_repository, audit_repo=audit_repository, artifact_store=artifact_store, artifact_metadata_repo=artifact_metadata_repository, uuid_generator=uuid_generator, ) generate_input_files_use_case = providers.Factory( GenerateInputFilesUseCase, job_repo=job_repository, stage_repo=stage_repository, audit_repo=audit_repository, artifact_store=artifact_store, artifact_metadata_repo=artifact_metadata_repository, uuid_generator=uuid_generator, default_policy_path=default_policy_path, policy_schema_path=policy_schema_path, ) create_build_image_use_case = 
providers.Factory( CreateBuildImageUseCase, job_repo=job_repository, stage_repo=stage_repository, audit_repo=audit_repository, config_service=build_image_config_service, queue_service=playbook_queue_request_service, inventory_repo=input_repository, uuid_generator=uuid_generator, ) validate_image_on_test_use_case = providers.Factory( ValidateImageOnTestUseCase, job_repo=job_repository, stage_repo=stage_repository, audit_repo=audit_repository, queue_service=validate_queue_service, uuid_generator=uuid_generator, ) class ProdContainer(containers.DeclarativeContainer): # pylint: disable=R0903 """Production profile container. Uses PostgreSQL-backed SQL repositories for persistent storage. Activated when ENV=prod (default). """ wiring_config = containers.WiringConfiguration( modules=[ "api.dependencies", "api.jobs.routes", "api.jobs.dependencies", "api.local_repo.routes", "api.local_repo.dependencies", "api.build_image.routes", "api.build_image.dependencies", "api.validate.routes", "api.validate.dependencies", "api.parse_catalog.routes", "api.parse_catalog.dependencies", ] ) job_id_generator = providers.Singleton(JobUUIDGenerator) uuid_generator = providers.Singleton(UUIDv4Generator) default_policy_path = providers.Singleton( SafePath, value=_DEFAULT_POLICY_PATH, ) policy_schema_path = providers.Singleton( SafePath, value=_DEFAULT_SCHEMA_PATH, ) # --- Database session factory --- # Note: In prod, each repository gets its own session from this factory. # For shared sessions within a request, use FastAPI dependencies to inject # a single session and build repositories manually (see api/jobs/dependencies.py). db_session = providers.Factory(SessionLocal) # --- Jobs repositories (PostgreSQL-backed) --- job_repository = providers.Factory(SqlJobRepository, session=db_session) stage_repository = providers.Factory(SqlStageRepository, session=db_session) idempotency_repository = providers.Factory(SqlIdempotencyRepository, session=db_session) audit_repository = providers.Factory(SqlAuditEventRepository, session=db_session) # --- Consolidated input repository --- input_repository = providers.Singleton( NfsInputRepository, ) # --- Queue repositories --- playbook_queue_request_repository = providers.Singleton( NfsPlaybookQueueRequestRepository, ) playbook_queue_result_repository = providers.Singleton( NfsPlaybookQueueResultRepository, ) # --- Local repo services --- input_file_service = providers.Factory( InputFileService, input_repo=input_repository, ) playbook_queue_request_service = providers.Factory( PlaybookQueueRequestService, request_repo=playbook_queue_request_repository, ) playbook_queue_result_service = providers.Factory( PlaybookQueueResultService, result_repo=playbook_queue_result_repository, ) # --- Build image services --- build_image_config_service = providers.Factory( BuildImageConfigService, config_repo=input_repository, ) # --- Validate services --- validate_queue_service = providers.Factory( ValidateQueueService, queue_repo=playbook_queue_request_repository, ) # --- Result poller --- result_poller = providers.Singleton( ResultPoller, result_service=playbook_queue_result_service, job_repo=job_repository, stage_repo=stage_repository, audit_repo=audit_repository, uuid_generator=uuid_generator, poll_interval=int(os.getenv("RESULT_POLL_INTERVAL", "5")), ) # --- Use cases --- artifact_store = providers.Singleton(_create_artifact_store) artifact_metadata_repository = providers.Factory( SqlArtifactMetadataRepository, session=db_session, ) create_job_use_case = providers.Factory( CreateJobUseCase, 
job_repo=job_repository, stage_repo=stage_repository, idempotency_repo=idempotency_repository, audit_repo=audit_repository, job_id_generator=job_id_generator, uuid_generator=uuid_generator, ) create_local_repo_use_case = providers.Factory( CreateLocalRepoUseCase, job_repo=job_repository, stage_repo=stage_repository, audit_repo=audit_repository, input_file_service=input_file_service, playbook_queue_service=playbook_queue_request_service, uuid_generator=uuid_generator, ) parse_catalog_use_case = providers.Factory( ParseCatalogUseCase, job_repo=job_repository, stage_repo=stage_repository, audit_repo=audit_repository, artifact_store=artifact_store, artifact_metadata_repo=artifact_metadata_repository, uuid_generator=uuid_generator, ) create_build_image_use_case = providers.Factory( CreateBuildImageUseCase, job_repo=job_repository, stage_repo=stage_repository, audit_repo=audit_repository, config_service=build_image_config_service, queue_service=playbook_queue_request_service, inventory_repo=input_repository, uuid_generator=uuid_generator, ) validate_image_on_test_use_case = providers.Factory( ValidateImageOnTestUseCase, job_repo=job_repository, stage_repo=stage_repository, audit_repo=audit_repository, queue_service=validate_queue_service, uuid_generator=uuid_generator, ) generate_input_files_use_case = providers.Factory( GenerateInputFilesUseCase, job_repo=job_repository, stage_repo=stage_repository, audit_repo=audit_repository, artifact_store=artifact_store, artifact_metadata_repo=artifact_metadata_repository, uuid_generator=uuid_generator, default_policy_path=default_policy_path, policy_schema_path=policy_schema_path, ) def get_container_class(): """Select container class based on ENV environment variable. Returns: ProdContainer if ENV=prod (default) DevContainer if ENV=dev Usage: # Set environment variable before running ENV=dev python main.py # Or set in code before importing os.environ['ENV'] = 'dev' # Or set in shell export ENV=dev python main.py # Windows PowerShell $env:ENV = "dev" python main.py # Windows Command Prompt set ENV=dev python main.py """ env = os.getenv("ENV", "prod").lower() if env == "prod": return ProdContainer return DevContainer Container = get_container_class() # Singleton container instance shared across app and dependencies container = Container() __all__ = ["Container", "container", "get_container_class"] ================================================ FILE: build_stream/core/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. ================================================ FILE: build_stream/core/artifacts/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. 
# You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Artifact domain module for Build Stream.""" from .value_objects import ( ArtifactKey, ArtifactDigest, ArtifactRef, ArtifactKind, StoreHint, SafePath, ) from .exceptions import ( ArtifactDomainError, ArtifactNotFoundError, ArtifactAlreadyExistsError, ArtifactStoreError, ArtifactValidationError, ) from .entities import ArtifactRecord from .ports import ArtifactStore, ArtifactMetadataRepository __all__ = [ "ArtifactKey", "ArtifactDigest", "ArtifactRef", "ArtifactKind", "StoreHint", "SafePath", "ArtifactDomainError", "ArtifactNotFoundError", "ArtifactAlreadyExistsError", "ArtifactStoreError", "ArtifactValidationError", "ArtifactRecord", "ArtifactStore", "ArtifactMetadataRepository", ] ================================================ FILE: build_stream/core/artifacts/entities.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Artifact domain entities.""" from dataclasses import dataclass from datetime import datetime, timezone from typing import Dict, Optional from core.jobs.value_objects import JobId, StageName from .value_objects import ArtifactKind, ArtifactRef @dataclass class ArtifactRecord: """Metadata entity linking an artifact to its producing context. Persisted in the Metadata Store for cross-stage artifact lookup. Each (job_id, stage_name, label) triple is unique. Attributes: id: Unique record identifier. job_id: Parent job identifier. stage_name: Stage that produced this artifact. label: Human-readable artifact label for cross-stage lookup. artifact_ref: Reference to the stored artifact content. kind: FILE or ARCHIVE. content_type: MIME content type. tags: Key-value metadata for queryability. created_at: Record creation timestamp. 
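    Example:
        Illustrative construction; identifier and label values are
        placeholders, and `ref` stands for an ArtifactRef previously returned
        by the artifact store:

            record = ArtifactRecord(
                id="9c1d2e3f-1111-2222-3333-444455556666",
                job_id=JobId("3fa85f64-5717-4562-b3fc-2c963f66afa6"),
                stage_name=StageName("parse-catalog"),
                label="parsed-catalog",
                artifact_ref=ref,
                kind=ArtifactKind.FILE,
                content_type="application/json",
                tags={"source": "upload"},
            )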
""" id: str job_id: JobId stage_name: StageName label: str artifact_ref: ArtifactRef kind: ArtifactKind content_type: str = "application/octet-stream" tags: Optional[Dict[str, str]] = None created_at: Optional[datetime] = None LABEL_MAX_LENGTH: int = 128 CONTENT_TYPE_MAX_LENGTH: int = 128 def __post_init__(self) -> None: """Validate and initialize record fields.""" if not self.label or not self.label.strip(): raise ValueError("ArtifactRecord label cannot be empty") if len(self.label) > self.LABEL_MAX_LENGTH: raise ValueError( f"ArtifactRecord label length cannot exceed " f"{self.LABEL_MAX_LENGTH} characters, got {len(self.label)}" ) if len(self.content_type) > self.CONTENT_TYPE_MAX_LENGTH: raise ValueError( f"ArtifactRecord content_type length cannot exceed " f"{self.CONTENT_TYPE_MAX_LENGTH} characters, " f"got {len(self.content_type)}" ) if self.tags is None: self.tags = {} if self.created_at is None: self.created_at = datetime.now(timezone.utc) ================================================ FILE: build_stream/core/artifacts/exceptions.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Domain exceptions for Artifact aggregate.""" from typing import Optional class ArtifactDomainError(Exception): """Base exception for all artifact domain errors.""" def __init__(self, message: str, correlation_id: Optional[str] = None) -> None: """Initialize artifact domain error. Args: message: Human-readable error description. correlation_id: Optional correlation ID for tracing. """ super().__init__(message) self.message = message self.correlation_id = correlation_id class ArtifactNotFoundError(ArtifactDomainError): """Artifact does not exist in the store.""" def __init__( self, key: str, correlation_id: Optional[str] = None, ) -> None: """Initialize artifact not found error. Args: key: The artifact key that was not found. correlation_id: Optional correlation ID for tracing. """ super().__init__( f"Artifact not found: {key}", correlation_id=correlation_id, ) self.key = key class ArtifactAlreadyExistsError(ArtifactDomainError): """Artifact with the given key already exists (immutability enforced).""" def __init__( self, key: str, correlation_id: Optional[str] = None, ) -> None: """Initialize artifact already exists error. Args: key: The artifact key that already exists. correlation_id: Optional correlation ID for tracing. """ super().__init__( f"Artifact already exists: {key}", correlation_id=correlation_id, ) self.key = key class ArtifactStoreError(ArtifactDomainError): """Infrastructure-level artifact store failure.""" def __init__( self, message: str, correlation_id: Optional[str] = None, ) -> None: """Initialize artifact store error. Args: message: Human-readable error description. correlation_id: Optional correlation ID for tracing. 
""" super().__init__(message, correlation_id=correlation_id) class ArtifactValidationError(ArtifactDomainError): """Artifact content fails validation (size, content-type, etc.).""" def __init__( self, message: str, correlation_id: Optional[str] = None, ) -> None: """Initialize artifact validation error. Args: message: Human-readable validation error description. correlation_id: Optional correlation ID for tracing. """ super().__init__(message, correlation_id=correlation_id) ================================================ FILE: build_stream/core/artifacts/interfaces.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Repository interfaces (Protocols) for Artifact domain. These define the contracts that infrastructure implementations must satisfy. """ from pathlib import Path from typing import Dict, List, Optional, Protocol, Union from core.jobs.value_objects import JobId, StageName from .entities import ArtifactRecord from .value_objects import ArtifactKey, ArtifactKind, ArtifactRef, StoreHint class ArtifactStore(Protocol): """Port for persisting and retrieving immutable artifact content. Unified API: callers pass ArtifactKind to indicate shape. The store dispatches internally based on kind. For ARCHIVE kind, callers provide either: - file_map: Dict[str, bytes] for in-memory content subsets - source_directory: Path for zipping an entire directory For FILE kind, callers provide: - content: bytes """ def store( self, hint: StoreHint, kind: ArtifactKind, content: Optional[bytes] = None, file_map: Optional[Dict[str, bytes]] = None, source_directory: Optional[Path] = None, content_type: str = "application/octet-stream", ) -> ArtifactRef: """Store an artifact. Args: hint: Hints for deterministic key generation. kind: FILE or ARCHIVE. content: Raw bytes (required for FILE kind). file_map: Mapping of relative paths to bytes (ARCHIVE kind). source_directory: Directory to zip (ARCHIVE kind). content_type: MIME type of the content. Returns: ArtifactRef with key, digest, size, and URI. Raises: ArtifactAlreadyExistsError: If artifact with same key exists. ArtifactValidationError: If content fails validation. ArtifactStoreError: If storage operation fails. ValueError: If wrong inputs for the given kind. """ ... def retrieve( self, key: ArtifactKey, kind: ArtifactKind, destination: Optional[Path] = None, ) -> Union[bytes, Path]: """Retrieve an artifact. For FILE kind: returns bytes (destination ignored). For ARCHIVE kind: unpacks to destination and returns the path. If destination is None, creates a temp directory. Args: key: Artifact key to retrieve. kind: FILE or ARCHIVE. destination: Target directory for ARCHIVE unpacking. Returns: bytes for FILE kind, Path for ARCHIVE kind. Raises: ArtifactNotFoundError: If artifact does not exist. ArtifactStoreError: If retrieval fails. """ ... def exists(self, key: ArtifactKey) -> bool: """Check if an artifact exists. Args: key: Artifact key to check. 
Returns: True if artifact exists, False otherwise. """ ... def delete(self, key: ArtifactKey) -> bool: """Delete an artifact. Args: key: Artifact key to delete. Returns: True if artifact was deleted, False if not found. """ ... def generate_key(self, hint: StoreHint, kind: ArtifactKind) -> ArtifactKey: """Generate a deterministic artifact key from hints. Args: hint: Store hints for key generation. kind: FILE or ARCHIVE (affects extension). Returns: Deterministic ArtifactKey. """ ... class ArtifactMetadataRepository(Protocol): """Port for persisting artifact metadata records. Used for cross-stage artifact lookup by (job_id, stage_name, label). """ def save(self, record: ArtifactRecord) -> None: """Persist an artifact metadata record. Args: record: ArtifactRecord to persist. """ ... def find_by_job_stage_and_label( self, job_id: JobId, stage_name: StageName, label: str, ) -> Optional[ArtifactRecord]: """Find an artifact record by job, stage, and label. Args: job_id: Parent job identifier. stage_name: Stage that produced the artifact. label: Artifact label. Returns: ArtifactRecord if found, None otherwise. """ ... def find_by_job(self, job_id: JobId) -> List[ArtifactRecord]: """Find all artifact records for a job. Args: job_id: Parent job identifier. Returns: List of ArtifactRecord (may be empty). """ ... def delete_by_job(self, job_id: JobId) -> int: """Delete all artifact records for a job. Args: job_id: Parent job identifier. Returns: Number of records deleted. """ ... ================================================ FILE: build_stream/core/artifacts/ports.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Repository port interfaces (Protocols) for Artifact domain. These define the contracts that infrastructure implementations must satisfy. """ from pathlib import Path from typing import Dict, List, Optional, Protocol, Union from core.jobs.value_objects import JobId, StageName from .entities import ArtifactRecord from .value_objects import ArtifactKey, ArtifactKind, ArtifactRef, StoreHint class ArtifactStore(Protocol): """Port for persisting and retrieving immutable artifact content. Unified API: callers pass ArtifactKind to indicate shape. The store dispatches internally based on kind. For ARCHIVE kind, callers provide either: - file_map: Dict[str, bytes] for in-memory content subsets - source_directory: Path for zipping an entire directory For FILE kind, callers provide: - content: bytes """ def store( self, hint: StoreHint, kind: ArtifactKind, content: Optional[bytes] = None, file_map: Optional[Dict[str, bytes]] = None, source_directory: Optional[Path] = None, content_type: str = "application/octet-stream", ) -> ArtifactRef: """Store an artifact. Args: hint: Hints for deterministic key generation. kind: FILE or ARCHIVE. content: Raw bytes (required for FILE kind). file_map: Mapping of relative paths to bytes (ARCHIVE kind). source_directory: Directory to zip (ARCHIVE kind). 
content_type: MIME type of the content. Returns: ArtifactRef with key, digest, size, and URI. Raises: ArtifactAlreadyExistsError: If artifact with same key exists. ArtifactValidationError: If content fails validation. ArtifactStoreError: If storage operation fails. ValueError: If wrong inputs for the given kind. """ ... def retrieve( self, key: ArtifactKey, kind: ArtifactKind, destination: Optional[Path] = None, ) -> Union[bytes, Path]: """Retrieve an artifact. For FILE kind: returns bytes (destination ignored). For ARCHIVE kind: unpacks to destination and returns the path. If destination is None, creates a temp directory. Args: key: Artifact key to retrieve. kind: FILE or ARCHIVE. destination: Target directory for ARCHIVE unpacking. Returns: bytes for FILE kind, Path for ARCHIVE kind. Raises: ArtifactNotFoundError: If artifact does not exist. ArtifactStoreError: If retrieval fails. """ ... def exists(self, key: ArtifactKey) -> bool: """Check if an artifact exists. Args: key: Artifact key to check. Returns: True if artifact exists, False otherwise. """ ... def delete(self, key: ArtifactKey) -> bool: """Delete an artifact. Args: key: Artifact key to delete. Returns: True if artifact was deleted, False if not found. """ ... def generate_key(self, hint: StoreHint, kind: ArtifactKind) -> ArtifactKey: """Generate a deterministic artifact key from hints. Args: hint: Store hints for key generation. kind: FILE or ARCHIVE (affects extension). Returns: Deterministic ArtifactKey. """ ... class ArtifactMetadataRepository(Protocol): """Port for persisting artifact metadata records. Used for cross-stage artifact lookup by (job_id, stage_name, label). """ def save(self, record: ArtifactRecord) -> None: """Persist an artifact metadata record. Args: record: ArtifactRecord to persist. """ ... def find_by_job_stage_and_label( self, job_id: JobId, stage_name: StageName, label: str, ) -> Optional[ArtifactRecord]: """Find an artifact record by job, stage, and label. Args: job_id: Parent job identifier. stage_name: Stage that produced the artifact. label: Artifact label. Returns: ArtifactRecord if found, None otherwise. """ ... def find_by_job(self, job_id: JobId) -> List[ArtifactRecord]: """Find all artifact records for a job. Args: job_id: Parent job identifier. Returns: List of ArtifactRecord (may be empty). """ ... def delete_by_job(self, job_id: JobId) -> int: """Delete all artifact records for a job. Args: job_id: Parent job identifier. Returns: Number of records deleted. """ ... ================================================ FILE: build_stream/core/artifacts/value_objects.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Value objects for Artifact domain. All value objects are immutable and defined by their values, not identity. 
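For example (illustrative), two value objects built from the same data compare equal even though they are distinct instances:

    ArtifactKey("catalog/abc123/catalog-file.json") == ArtifactKey("catalog/abc123/catalog-file.json")  # True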
""" import re from dataclasses import dataclass from enum import Enum from pathlib import Path, PurePosixPath from typing import ClassVar, Dict, Optional class ArtifactKind(str, Enum): """Shape of artifact content. FILE: Single file (e.g., catalog.json). ARCHIVE: Multiple files packed as a zip archive. """ FILE = "FILE" ARCHIVE = "ARCHIVE" @dataclass(frozen=True) class SafePath: """Validated filesystem path value object. Wraps pathlib.Path with security validation to prevent path traversal attacks and enforce length constraints. Attributes: value: The validated Path object. Raises: ValueError: If path is empty, too long, or contains traversal sequences. """ value: Path MAX_LENGTH: ClassVar[int] = 4096 ENCODED_TRAVERSAL_PATTERNS: ClassVar[tuple] = ("%2e%2e", "%2E%2E") def __post_init__(self) -> None: """Validate path safety and length.""" str_value = str(self.value) # Path("") resolves to "." in Python, so check original parts too if not str_value or not str_value.strip() or str_value == ".": raise ValueError("SafePath cannot be empty") if len(str_value) > self.MAX_LENGTH: raise ValueError( f"SafePath length cannot exceed {self.MAX_LENGTH} characters, " f"got {len(str_value)}" ) # Check for '..' as a path component (directory traversal) if ".." in self.value.parts: raise ValueError( "SafePath must not contain path traversal component: .." ) for pattern in self.ENCODED_TRAVERSAL_PATTERNS: if pattern in str_value: raise ValueError( f"SafePath must not contain path traversal sequence: {pattern}" ) if "\x00" in str_value: raise ValueError("SafePath must not contain null bytes") @classmethod def from_string(cls, path_str: str) -> "SafePath": """Create SafePath from a string. Args: path_str: String representation of the path. Returns: Validated SafePath instance. """ return cls(value=Path(path_str)) def __str__(self) -> str: """Return string representation.""" return str(self.value) @dataclass(frozen=True) class ArtifactKey: """Unique key identifying an artifact in the store. Generated deterministically from StoreHint components. Attributes: value: Key string (e.g., "catalog/abc123/catalog-file.json"). Raises: ValueError: If value is empty, too long, or contains traversal. """ value: str MIN_LENGTH: ClassVar[int] = 1 MAX_LENGTH: ClassVar[int] = 512 def __post_init__(self) -> None: """Validate key format and length.""" if not self.value or not self.value.strip(): raise ValueError("ArtifactKey cannot be empty") if len(self.value) > self.MAX_LENGTH: raise ValueError( f"ArtifactKey length cannot exceed {self.MAX_LENGTH} characters, " f"got {len(self.value)}" ) if ".." in self.value or "\\" in self.value: raise ValueError( f"ArtifactKey must not contain path traversal or backslash: {self.value}" ) if self.value.startswith("/"): raise ValueError( f"ArtifactKey must not be an absolute path: {self.value}" ) if "\x00" in self.value: raise ValueError("ArtifactKey must not contain null bytes") def __str__(self) -> str: """Return string representation.""" return self.value @dataclass(frozen=True) class ArtifactDigest: """SHA-256 hex digest of artifact content. Attributes: value: 64-character lowercase hex string. Raises: ValueError: If value does not match SHA-256 pattern. 
""" value: str SHA256_PATTERN: ClassVar[str] = r"^[0-9a-f]{64}$" MAX_LENGTH: ClassVar[int] = 64 def __post_init__(self) -> None: """Validate SHA-256 format.""" if len(self.value) > self.MAX_LENGTH: raise ValueError( f"ArtifactDigest length cannot exceed {self.MAX_LENGTH} characters, " f"got {len(self.value)}" ) if not re.match(self.SHA256_PATTERN, self.value): raise ValueError( f"Invalid SHA-256 hex digest: {self.value}. " f"Expected 64 lowercase hexadecimal characters." ) def __str__(self) -> str: """Return string representation.""" return self.value @dataclass(frozen=True) class ArtifactRef: """Immutable reference to a stored artifact. Returned by ArtifactStore.store() after successful storage. Attributes: key: Unique artifact key. digest: SHA-256 content digest. size_bytes: Content size in bytes. uri: Storage-specific location URI. Raises: ValueError: If any field is invalid. """ key: ArtifactKey digest: ArtifactDigest size_bytes: int uri: str URI_MAX_LENGTH: ClassVar[int] = 4096 def __post_init__(self) -> None: """Validate artifact reference fields.""" if self.size_bytes < 0: raise ValueError( f"size_bytes must be non-negative, got {self.size_bytes}" ) if not self.uri: raise ValueError("ArtifactRef URI cannot be empty") if len(self.uri) > self.URI_MAX_LENGTH: raise ValueError( f"ArtifactRef URI length cannot exceed {self.URI_MAX_LENGTH} " f"characters, got {len(self.uri)}" ) @dataclass(frozen=True) class StoreHint: """Hints for deterministic artifact key generation. Callers provide hints so the store can generate a deterministic, collision-free key. The namespace groups artifacts logically, the label identifies the artifact within a stage, and tags provide additional disambiguation (e.g., job_id). Attributes: namespace: Logical grouping (e.g., "catalog", "input-files"). label: Human-readable artifact name (e.g., "catalog-file", "root-jsons"). tags: Key-value metadata for disambiguation and queryability. Raises: ValueError: If namespace or label is invalid. """ namespace: str label: str tags: Dict[str, str] NAMESPACE_MAX_LENGTH: ClassVar[int] = 128 LABEL_MAX_LENGTH: ClassVar[int] = 128 MAX_TAGS: ClassVar[int] = 20 TAG_KEY_MAX_LENGTH: ClassVar[int] = 64 TAG_VALUE_MAX_LENGTH: ClassVar[int] = 256 def __post_init__(self) -> None: """Validate hint fields.""" if not self.namespace or not self.namespace.strip(): raise ValueError("StoreHint namespace cannot be empty") if len(self.namespace) > self.NAMESPACE_MAX_LENGTH: raise ValueError( f"StoreHint namespace length cannot exceed " f"{self.NAMESPACE_MAX_LENGTH} characters, got {len(self.namespace)}" ) if not self.label or not self.label.strip(): raise ValueError("StoreHint label cannot be empty") if len(self.label) > self.LABEL_MAX_LENGTH: raise ValueError( f"StoreHint label length cannot exceed " f"{self.LABEL_MAX_LENGTH} characters, got {len(self.label)}" ) if len(self.tags) > self.MAX_TAGS: raise ValueError( f"StoreHint cannot have more than {self.MAX_TAGS} tags, " f"got {len(self.tags)}" ) for key, val in self.tags.items(): if len(key) > self.TAG_KEY_MAX_LENGTH: raise ValueError( f"Tag key length cannot exceed {self.TAG_KEY_MAX_LENGTH} " f"characters, got {len(key)}" ) if len(val) > self.TAG_VALUE_MAX_LENGTH: raise ValueError( f"Tag value length cannot exceed {self.TAG_VALUE_MAX_LENGTH} " f"characters, got {len(val)}" ) ================================================ FILE: build_stream/core/build/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. 
# # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. ================================================ FILE: build_stream/core/build_image/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Build Image domain module. This module contains domain logic for build image operations. """ from core.build_image.entities import BuildImageRequest from core.build_image.exceptions import ( BuildImageDomainError, InvalidArchitectureError, InvalidImageKeyError, InvalidFunctionalGroupsError, ) from core.build_image.value_objects import ( Architecture, ImageKey, FunctionalGroups, InventoryHost, ) __all__ = [ "BuildImageRequest", "BuildImageDomainError", "InvalidArchitectureError", "InvalidImageKeyError", "InvalidFunctionalGroupsError", "Architecture", "ImageKey", "FunctionalGroups", "InventoryHost", ] ================================================ FILE: build_stream/core/build_image/entities.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Domain entities for Build Image module.""" from dataclasses import dataclass from datetime import datetime, timezone from typing import Any, Dict, Optional from core.localrepo.value_objects import ExecutionTimeout, ExtraVars, PlaybookPath @dataclass(frozen=True) # pylint: disable=too-many-instance-attributes class BuildImageRequest: """Immutable entity representing a build image request. Written to the NFS queue for OIM Core consumption. Compatible with PlaybookRequest interface for reuse of existing repository. Attributes: job_id: Parent job identifier. stage_name: Stage identifier (build-image). playbook_path: Validated path to the playbook. extra_vars: Ansible extra variables (includes architecture, image_key, functional_groups). inventory_file_path: Optional path to inventory file for aarch64 builds. correlation_id: Request tracing identifier. 
timeout: Execution timeout configuration. submitted_at: Request submission timestamp. request_id: Unique request identifier. """ job_id: str stage_name: str playbook_path: PlaybookPath extra_vars: ExtraVars correlation_id: str timeout: ExecutionTimeout submitted_at: str request_id: str inventory_file_path: Optional[str] = None def to_dict(self) -> Dict[str, Any]: """Serialize request to dictionary for JSON file writing.""" request_dict = { "job_id": self.job_id, "stage_name": self.stage_name, "playbook_path": str(self.playbook_path), "extra_vars": self.extra_vars.to_dict(), "correlation_id": self.correlation_id, "timeout_minutes": self.timeout.minutes, "submitted_at": self.submitted_at, "request_id": self.request_id, } # Add inventory file path if present if self.inventory_file_path: request_dict["inventory_file_path"] = self.inventory_file_path return request_dict def generate_filename(self) -> str: """Generate request file name following naming convention. Returns: Filename: {job_id}_{stage_name}_{timestamp}.json """ timestamp = datetime.now(timezone.utc).strftime("%Y%m%d_%H%M%S") return f"{self.job_id}_{self.stage_name}_{timestamp}.json" def get_playbook_command(self) -> str: """Generate the ansible-playbook command based on request parameters. Returns: Complete ansible-playbook command string. """ # Base command cmd = f'ansible-playbook {self.playbook_path}' # Add inventory file for aarch64 if self.inventory_file_path: cmd += f' -i {self.inventory_file_path}' # Add extra vars extra_vars = self.extra_vars.to_dict() cmd += f' -e job_id="{extra_vars["job_id"]}"' cmd += f' -e image_key="{extra_vars["image_key"]}"' cmd += f' -e functional_groups=\'{extra_vars["functional_groups"]}\'' return cmd ================================================ FILE: build_stream/core/build_image/exceptions.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Build Image domain exceptions.""" class BuildImageDomainError(Exception): """Base exception for build image domain errors.""" def __init__(self, message: str, correlation_id: str = ""): """Initialize domain error. Args: message: Error message. correlation_id: Request correlation ID for tracing. """ super().__init__(message) self.message = message self.correlation_id = correlation_id class InvalidArchitectureError(BuildImageDomainError): """Raised when architecture is invalid or unsupported.""" class InvalidImageKeyError(BuildImageDomainError): """Raised when image key is invalid.""" class InvalidFunctionalGroupsError(BuildImageDomainError): """Raised when functional groups are invalid.""" class InventoryHostMissingError(BuildImageDomainError): """Raised when inventory host is missing from configuration.""" ================================================ FILE: build_stream/core/build_image/repositories.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. 
# # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Repository interfaces for Build Image module.""" from abc import ABC, abstractmethod from pathlib import Path from typing import Optional from core.build_image.value_objects import Architecture, InventoryHost class BuildStreamConfigRepository(ABC): """Repository for reading build stream configuration.""" @abstractmethod def get_aarch64_inv_host(self, job_id: str) -> Optional[InventoryHost]: """Get aarch64 inventory host for builds. Args: job_id: Job identifier. Returns: Inventory host IP or None if not configured. Raises: ConfigFileError: If config file cannot be read. """ ... class BuildImageInventoryRepository(ABC): """Repository for creating and managing inventory files for aarch64 builds.""" @abstractmethod def create_inventory_file(self, inventory_host: InventoryHost, job_id: str) -> Path: """Create an inventory file for aarch64 builds. Args: inventory_host: The inventory host IP address. job_id: Job identifier for tracking. Returns: Path to the created inventory file. Raises: IOError: If inventory file cannot be created. """ ... ================================================ FILE: build_stream/core/build_image/services.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Domain services for Build Image module.""" import logging from typing import Optional from core.build_image.entities import BuildImageRequest from core.build_image.exceptions import InventoryHostMissingError from core.build_image.repositories import BuildStreamConfigRepository from core.build_image.value_objects import Architecture, InventoryHost from core.jobs.value_objects import CorrelationId logger = logging.getLogger(__name__) class BuildImageConfigService: """Service for build image configuration operations.""" def __init__(self, config_repo: BuildStreamConfigRepository): """Initialize service with repository.""" self._config_repo = config_repo def get_inventory_host( self, job_id: str, architecture: Architecture, correlation_id: str ) -> Optional[InventoryHost]: """Get inventory host for aarch64 builds. Args: job_id: Job identifier. architecture: Target architecture. correlation_id: Correlation ID for error reporting. Returns: Inventory host for aarch64, None for x86_64. Raises: InventoryHostMissingError: If aarch64 and no host configured. 
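        Example (illustrative identifiers):
            # x86_64 builds never need an inventory host, so this returns None:
            service.get_inventory_host("job-42", Architecture("x86_64"), "corr-1")
            # aarch64 returns the configured host, or raises
            # InventoryHostMissingError when none is configured.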
""" if architecture.is_x86_64: return None # For aarch64, inventory host is required inventory_host = self._config_repo.get_aarch64_inv_host(job_id) if not inventory_host: raise InventoryHostMissingError( "Inventory host is required for aarch64 builds", correlation_id ) return inventory_host class BuildImageQueueService: """Service for build image queue operations.""" def __init__(self, queue_repo): """Initialize service with PlaybookQueueRequestRepository.""" self._queue_repo = queue_repo def submit_request(self, request: BuildImageRequest, correlation_id: CorrelationId): """Submit build image request to queue. Args: request: BuildImageRequest to submit. correlation_id: Correlation ID for tracing. Raises: QueueUnavailableError: If queue is not accessible. """ logger.info( "Submitting build image request to queue: job_id=%s, correlation_id=%s", request.job_id, correlation_id, ) self._queue_repo.write_request(request) logger.info( "Build image request submitted successfully: job_id=%s, " "request_id=%s, correlation_id=%s", request.job_id, request.request_id, correlation_id, ) ================================================ FILE: build_stream/core/build_image/value_objects.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Value objects for Build Image domain. All value objects are immutable and defined by their values, not identity. """ import re from dataclasses import dataclass from typing import ClassVar, List @dataclass(frozen=True) class Architecture: """Build image architecture type. Attributes: value: Architecture name (x86_64 or aarch64). Raises: ValueError: If architecture is not supported. """ value: str SUPPORTED_ARCHITECTURES: ClassVar[List[str]] = ["x86_64", "aarch64"] def __post_init__(self) -> None: """Validate architecture.""" if not self.value or not self.value.strip(): raise ValueError("Architecture cannot be empty") if self.value not in self.SUPPORTED_ARCHITECTURES: raise ValueError( f"Unsupported architecture: {self.value}. " f"Supported: {', '.join(self.SUPPORTED_ARCHITECTURES)}" ) def __str__(self) -> str: """Return string representation.""" return self.value @property def is_x86_64(self) -> bool: """Check if architecture is x86_64.""" return self.value == "x86_64" @property def is_aarch64(self) -> bool: """Check if architecture is aarch64.""" return self.value == "aarch64" @dataclass(frozen=True) class ImageKey: """Image key identifier for build image. Attributes: value: Image key string. Raises: ValueError: If image key format is invalid. 
""" value: str MAX_LENGTH: ClassVar[int] = 128 KEY_PATTERN: ClassVar[str] = r'^[a-zA-Z0-9_\-]+$' def __post_init__(self) -> None: """Validate image key format.""" if not self.value or not self.value.strip(): raise ValueError("Image key cannot be empty") if len(self.value) > self.MAX_LENGTH: raise ValueError( f"Image key length cannot exceed {self.MAX_LENGTH} " f"characters, got {len(self.value)}" ) if not re.match(self.KEY_PATTERN, self.value): raise ValueError( f"Invalid image key format: {self.value}. " f"Must contain only alphanumeric characters, underscores, and hyphens." ) def __str__(self) -> str: """Return string representation.""" return self.value @dataclass(frozen=True) class FunctionalGroups: """Functional groups list for build image. Attributes: groups: List of functional group names. Raises: ValueError: If functional groups are invalid. """ groups: List[str] MAX_GROUPS: ClassVar[int] = 50 GROUP_PATTERN: ClassVar[str] = r'^[a-zA-Z0-9_\-]+$' def __post_init__(self) -> None: """Validate functional groups.""" if not self.groups: raise ValueError("Functional groups cannot be empty") if len(self.groups) > self.MAX_GROUPS: raise ValueError( f"Functional groups cannot exceed {self.MAX_GROUPS} groups, " f"got {len(self.groups)}" ) for group in self.groups: if not group or not group.strip(): raise ValueError("Functional group name cannot be empty") if not re.match(self.GROUP_PATTERN, group): raise ValueError( f"Invalid functional group name: {group}. " f"Must contain only alphanumeric characters, underscores, and hyphens." ) def to_list(self) -> List[str]: """Return a copy of the groups list.""" return list(self.groups) def __str__(self) -> str: """Return string representation.""" return str(self.groups) @dataclass(frozen=True) class InventoryHost: """Inventory host IP address for aarch64 builds. Attributes: value: IP address or hostname. Raises: ValueError: If host format is invalid. """ value: str MAX_LENGTH: ClassVar[int] = 255 HOST_PATTERN: ClassVar[str] = r'^[a-zA-Z0-9\.\-]+$' def __post_init__(self) -> None: """Validate inventory host format.""" if not self.value or not self.value.strip(): raise ValueError("Inventory host cannot be empty") if len(self.value) > self.MAX_LENGTH: raise ValueError( f"Inventory host length cannot exceed {self.MAX_LENGTH} " f"characters, got {len(self.value)}" ) if not re.match(self.HOST_PATTERN, self.value): raise ValueError( f"Invalid inventory host format: {self.value}. " f"Must contain only alphanumeric characters, dots, and hyphens." ) def __str__(self) -> str: """Return string representation.""" return self.value ================================================ FILE: build_stream/core/catalog/ADAPTER_POLICY_GUIDE.md ================================================ # Adapter Policy Guide This guide explains how to write the **adapter policy file** (`adapter_policy_default.json`) to generate adapter config JSONs. The adapter policy file lets you: - Pull one or more **roles** (top-level keys) from one or more **source JSON files** into a **target JSON file**. - Optionally **rename** roles while pulling. - Optionally **filter** packages while pulling (substring, allowlist, or composite filters). - Create a **derived role** that contains **common packages** across multiple roles. - Remove those common packages from the source roles so packages do not appear twice. --- ## 1. 
What the generator expects

### 1.1 Source files

The generator reads source files from the `--input-dir` directory, for each architecture/OS/version:

```text
<input-dir>/<arch>/<os>/<version>/
  base_os.json
  functional_layer.json
  infrastructure.json
  miscellaneous.json
  ...
```

Each source file is expected to be an object where each top-level key is a **role** or **feature**, e.g. `"K8S Controller"`, `"K8S Worker"`, etc. Each role has a `packages` list:

```json
{
  "K8S Controller": {
    "packages": [
      {"package": "kubeadm-v1.31.4-amd64", "type": "tarball", "uri": "..."}
    ]
  }
}
```

### 1.2 Output files

The mapping adapter writes target files under `--output-dir`:

```text
<output-dir>/<arch>/<os>/<version>/
  service_k8s.json
  slurm_custom.json
  default_packages.json
  ...
```

Each target file is an object of roles where each role contains a `cluster` list:

```json
{
  "service_kube_node": {
    "cluster": [
      {"package": "vim", "type": "rpm", "repo_name": "x86_64_appstream"}
    ]
  }
}
```

---

## 2. Adapter policy file structure

The adapter policy file is a JSON object with this shape:

- `version`: schema version (use `"2.0.0"`)
- `description`: human-readable description of the policy
- `targets`: mapping of **target filename** -> **target specification**

At a high level:

```json
{
  "version": "2.0.0",
  "description": "...",
  "targets": {
    "service_k8s.json": {
      "transform": {"exclude_fields": ["architecture"]},
      "sources": [ ... ],
      "derived": [ ... ]
    }
  }
}
```

---

## 3. Target spec

A target spec describes how to build a single target file.

### 3.1 `transform` (optional)

Applied to all packages written in this target, unless overridden per pull. Currently supported:

- `exclude_fields`: removes keys from each package object (commonly `architecture`).
- `rename_fields`: renames keys inside each package object.

### 3.2 `sources` (required)

A list of source specs. Each source spec pulls one or more roles from a single source file.

Each `source` has:

- `source_file`: e.g. `functional_layer.json`
- `pulls`: list of roles to pull

Each `pull` has:

- `source_key`: the role name in the source file
- `target_key` (optional): rename the role in the output. If omitted, the role name is unchanged.
- `filter` (optional): filter packages while pulling
- `transform` (optional): per-role transform override

### 3.3 `derived` (optional)

Defines derived roles that are computed from roles already pulled into the target. Currently supported derived operation:

- `extract_common`
  - Computes packages that appear in `min_occurrences` or more of the `from_keys` roles
  - Writes them into `target_key`
  - If `remove_from_sources=true`, those common packages are removed from each role in `from_keys`
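Conceptually, `extract_common` counts how many of the `from_keys` roles contain each package and promotes the ones that reach `min_occurrences` into the derived role. The Python sketch below is only an illustration of that idea (the `extract_common` function name is ours, packages are keyed on the `package` name alone for brevity, and `roles` uses the target-file `cluster` shape from section 1.2); it is not the generator's actual implementation:

```python
from collections import Counter
from typing import Dict, List


def extract_common(roles: Dict[str, dict], from_keys: List[str],
                   min_occurrences: int, remove_from_sources: bool) -> List[dict]:
    """Illustrative sketch of the extract_common derived operation."""
    counts: Counter = Counter()
    for key in from_keys:
        # Count each package name once per role it appears in.
        counts.update({pkg["package"] for pkg in roles[key]["cluster"]})
    common = {name for name, seen in counts.items() if seen >= min_occurrences}

    derived: List[dict] = []
    added: set = set()
    for key in from_keys:
        for pkg in roles[key]["cluster"]:
            if pkg["package"] in common and pkg["package"] not in added:
                added.add(pkg["package"])
                derived.append(pkg)
        if remove_from_sources:
            # Drop the promoted packages so they do not appear twice.
            roles[key]["cluster"] = [
                p for p in roles[key]["cluster"] if p["package"] not in common
            ]
    return derived
```

---

## 4.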
Fully worked example: `service_k8s.json` Goal: - Pull two roles from `functional_layer.json` - `K8S Controller` -> `service_kube_control_plane` - `K8S Worker` -> `service_kube_node` - Derive a new role called `service_k8s` containing packages common to both pulled roles - Remove those common packages from `service_kube_control_plane` and `service_kube_node` ```json { "version": "2.0.0", "description": "Example mapping: build service_k8s.json from functional_layer.json", "targets": { "service_k8s.json": { "transform": { "exclude_fields": ["architecture"] }, "sources": [ { "source_file": "functional_layer.json", "pulls": [ { "source_key": "K8S Controller", "target_key": "service_kube_control_plane" }, { "source_key": "K8S Worker", "target_key": "service_kube_node" } ] } ], "derived": [ { "target_key": "service_k8s", "operation": { "type": "extract_common", "from_keys": ["service_kube_control_plane", "service_kube_node"], "min_occurrences": 2, "remove_from_sources": true } } ] } } } ``` Resulting output file (`service_k8s.json`) will contain: - `service_kube_control_plane`: only control-plane-unique packages - `service_kube_node`: only node-unique packages - `service_k8s`: the common packages extracted from both --- ## 5. Filter types Filters select which packages to include when pulling from a source role. ### 5.1 `substring` filter Keeps packages where the specified `field` **contains** any of the `values` as a substring. | Property | Type | Default | Description | |----------|------|---------|-------------| | `type` | `"substring"` | — | Filter type | | `field` | string | `"package"` | Field to match against | | `values` | array of strings | — | Substrings to search for | | `case_sensitive` | boolean | `false` | Case-sensitive matching | **Example** — keep packages containing `nfs`: ```json { "filter": { "type": "substring", "field": "package", "values": ["nfs"], "case_sensitive": false } } ``` ### 5.2 `allowlist` filter Keeps packages where the specified `field` **exactly equals** one of the `values`. | Property | Type | Default | Description | |----------|------|---------|-------------| | `type` | `"allowlist"` | — | Filter type | | `field` | string | `"package"` | Field to match against | | `values` | array of strings | — | Exact values to allow | | `case_sensitive` | boolean | `false` | Case-sensitive matching | **Example** — keep only specific package names: ```json { "filter": { "type": "allowlist", "field": "package", "values": ["openldap", "openldap-clients", "openldap-servers"], "case_sensitive": false } } ``` ### 5.3 `any_of` composite filter Combines multiple filters with **OR** logic: a package is kept if it matches **any** of the nested filters. | Property | Type | Description | |----------|------|-------------| | `type` | `"any_of"` | Filter type | | `filters` | array of filter objects | Sub-filters to evaluate | **Example** — keep packages matching an allowlist **or** a substring: ```json { "filter": { "type": "any_of", "filters": [ { "type": "allowlist", "field": "package", "values": ["openldap", "openldap-clients", "openldap-servers"], "case_sensitive": false }, { "type": "substring", "field": "package", "values": ["ldap", "slapd"], "case_sensitive": false } ] } } ``` --- ## 6. 
Example: substring filtering (`nfs.json`)

Goal:

- Pull `Base OS` packages from `base_os.json`
- Only keep packages whose `package` contains substring `"nfs"`

```json
{
  "version": "2.0.0",
  "description": "Example mapping: build nfs.json from base_os.json",
  "targets": {
    "nfs.json": {
      "transform": {
        "exclude_fields": ["architecture"]
      },
      "sources": [
        {
          "source_file": "base_os.json",
          "pulls": [
            {
              "source_key": "Base OS",
              "target_key": "nfs",
              "filter": {
                "type": "substring",
                "field": "package",
                "values": ["nfs"],
                "case_sensitive": false
              }
            }
          ]
        }
      ]
    }
  }
}
```

---

## 7. Example: composite filtering (`openldap.json`)

Goal:

- Pull `Base OS` packages from `base_os.json`
- Keep packages that match **either**:
  - An explicit allowlist of known OpenLDAP package names, **or**
  - A broadened substring search (`ldap`, `openldap`, `slapd`)

```json
{
  "version": "2.0.0",
  "description": "Example mapping: build openldap.json using composite filter",
  "targets": {
    "openldap.json": {
      "transform": {
        "exclude_fields": ["architecture"]
      },
      "sources": [
        {
          "source_file": "base_os.json",
          "pulls": [
            {
              "source_key": "Base OS",
              "target_key": "openldap",
              "filter": {
                "type": "any_of",
                "filters": [
                  {
                    "type": "allowlist",
                    "field": "package",
                    "values": ["openldap", "openldap-clients", "openldap-servers"],
                    "case_sensitive": false
                  },
                  {
                    "type": "substring",
                    "field": "package",
                    "values": ["ldap", "openldap", "slapd"],
                    "case_sensitive": false
                  }
                ]
              }
            }
          ]
        }
      ]
    }
  }
}
```

---

## 8. Tips and common mistakes

- **Role names must match exactly**: `source_key` must exist in the source JSON.
- **Derived roles operate on target role names**: `from_keys` refers to the names after renaming (`target_key`).
- If you set `remove_from_sources=true`, verify you included the right keys in `from_keys`.
- Filters apply *before* transforms.


================================================
FILE: build_stream/core/catalog/README.md
================================================
| Code | Name                        | When it happens                                                                       |
|------|-----------------------------|---------------------------------------------------------------------------------------|
| 0    | SUCCESS                     | All processing completed successfully.                                                |
| 2    | ERROR_CODE_INPUT_NOT_FOUND  | Required input file is missing (catalog, schema, or a file needed during processing). |
| 3    | ERROR_CODE_PROCESSING_ERROR | Any other unexpected runtime error while parsing or generating outputs.               |

## Usage

### Catalog Parser CLI (`generator.py`)

Generates per-arch/OS/version feature-list JSONs (functional layer, infra, drivers, base OS, miscellaneous).

From the `poc/milestone-1` directory, run the generator as a module:

```bash
python -m catalog_parser.generator \
    --catalog <path/to/catalog.json> \
    [--schema <path/to/CatalogSchema.json>] \
    [--log-file <path/to/logfile.log>]
```

- `--catalog` (required): Path to input catalog JSON file.
- `--schema` (optional, default: `resources/CatalogSchema.json`): Path to catalog schema JSON file.
- `--log-file` (optional): Path to log file; if set, the directory is auto-created, otherwise logs go to stderr.

Outputs are written under:

```text
out/main/<arch>/<os>/<version>/
  functional_layer.json
  infrastructure.json
  drivers.json
  base_os.json
  miscellaneous.json
```

### Adapter Config Generator (`adapter.py`)

Generates adapter-style config JSONs from the catalog.

From the `poc/milestone-1` directory, run the adapter as a module:

```bash
python -m catalog_parser.adapter \
    --catalog <path/to/catalog.json> \
    [--schema <path/to/CatalogSchema.json>] \
    [--log-file <path/to/logfile.log>]
```

- `--catalog` (required): Path to input catalog JSON file.
- `--schema` (optional, default: `resources/CatalogSchema.json`): Path to catalog schema JSON file.
- `--log-file` (optional): Path to log file; if set, the directory is auto-created, otherwise logs go to stderr.

Outputs are written under:

```text
out/adapter/input/config/<arch>/<os>/<version>/
  default_packages.json
  nfs.json / openldap.json / openmpi.json (if data)
  service_k8s.json
  slurm_custom.json
  <infrastructure_feature>.json
  ...
```

### Programmatic usage

You can also call both components directly from Python without going through the CLI.

#### Catalog Parser API (`generator.py`)

Programmatic entry points:

- `generate_root_json_from_catalog(catalog_path, schema_path="resources/CatalogSchema.json", output_root="out/generator", *, log_file=None, configure_logging=False, log_level=logging.INFO)`
- `get_functional_layer_roles_from_file(functional_layer_json_path, *, configure_logging=False, log_file=None, log_level=logging.INFO)`
- `get_package_list(functional_layer_json_path, role=None, *, configure_logging=False, log_file=None, log_level=logging.INFO)`

Behavior:

- Optionally configures logging when `configure_logging=True` (and will create the log directory if needed).
- `generate_root_json_from_catalog` writes per-arch/OS/version feature-list JSONs under `output_root/<arch>/<os>/<version>/`.
- `get_functional_layer_roles_from_file` reads a `functional_layer.json` file, validates it, and returns a list of role names (feature names) present in the functional layer.
- `get_package_list` reads a `functional_layer.json` file and returns a list of role objects with their packages, suitable for use by REST APIs or other callers.

Example usage:

```python
from catalog_parser.generator import (
    get_functional_layer_roles_from_file,
    get_package_list,
)

functional_layer_path = "out/main/x86_64/rhel/10/functional_layer.json"

# Get all functional layer roles
roles = get_functional_layer_roles_from_file(functional_layer_path)
# roles might look like: ["Compiler", "K8S Controller", "K8S Worker", ...]

# Get packages for a specific role (case-insensitive role name)
compiler_packages = get_package_list(functional_layer_path, role="compiler")

# Get packages for all roles
all_role_packages = get_package_list(functional_layer_path)
```

Notes:

- Role matching is case-insensitive (for example, `"k8s controller"` matches `"K8S Controller"`).
- Passing `role=None` returns all roles.
- Passing an empty string for `role` is treated as invalid input and raises `ValueError`.

#### Adapter Config API (`adapter.py`)

Programmatic entry point:

- `generate_omnia_json_from_catalog(catalog_path, schema_path="resources/CatalogSchema.json", output_root="out/adapter/input/config", *, log_file=None, configure_logging=False, log_level=logging.INFO)`

Behavior:

- Optionally configures logging when `configure_logging=True` (and will create the log directory if needed).
- Writes adapter-style config JSONs under `output_root/<arch>/<os>/<version>/`.

#### Sample code

Example Python code showing how to call these APIs programmatically is available in:

- `tests/sample.py`


================================================
FILE: build_stream/core/catalog/__init__.py
================================================
# Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and # limitations under the License. ================================================ FILE: build_stream/core/catalog/adapter.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Catalog parser adapter. Transforms generated feature-list JSONs into omnia configuration JSONs. """ import json import os from collections import Counter from typing import Dict, Iterable, List, Tuple, Optional import argparse import logging import sys from jsonschema import ValidationError from .parser import ParseCatalog from .models import Catalog from .generator import ( FeatureList, Feature, Package, generate_functional_layer_json, generate_infrastructure_json, generate_base_os_json, generate_miscellaneous_json, _filter_featurelist_for_arch, _discover_arch_os_version_from_catalog, _package_common_dict, _validate_catalog_and_schema_paths, ) from .utils import _configure_logging logger = logging.getLogger(__name__) _BASE_DIR = os.path.dirname(__file__) _DEFAULT_SCHEMA_PATH = os.path.join(_BASE_DIR, "resources", "CatalogSchema.json") ERROR_CODE_INPUT_NOT_FOUND = 2 ERROR_CODE_PROCESSING_ERROR = 3 def _snake_case(name: str) -> str: return name.strip().lower().replace(" ", "_") def _package_key(pkg: Package) -> Tuple[str, str, str]: """Key used to detect common packages across features. Uses (package, type, repo_name) to distinguish identical names in different repos/types. """ return (pkg.package, pkg.type, pkg.repo_name) def _package_to_dict(pkg: Package) -> Dict[str, str]: # Adapter-specific wrapper over the shared helper; note that the # adapter JSONs intentionally do not include architecture. return _package_common_dict(pkg) # type: ignore[return-value] # -------------------------- Base OS / default packages -------------------------- def build_default_packages_config(base_os: FeatureList) -> Dict: """Build default_packages.json-style structure from Base OS FeatureList. Expected FeatureList has a feature named "Base OS". """ feature: Feature | None = base_os.features.get("Base OS") if feature is None: raise ValueError("Base OS feature not found in base_os FeatureList") cluster = [_package_to_dict(pkg) for pkg in feature.packages] logger.info("Built default_packages config with %d package(s)", len(cluster)) return {"default_packages": {"cluster": cluster}} def _build_subconfig_from_base_os( base_os: FeatureList, name: str, substrings: Iterable[str] ) -> Dict | None: """Generic helper to build nfs/openldap/openmpi-style configs. Selects packages from Base OS whose package name contains any of the substrings. Returns None if no packages match. 
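    Example (illustrative; this is how build_nfs_config uses it):
        _build_subconfig_from_base_os(base_os, "nfs", ["nfs"])
        # -> {"nfs": {"cluster": [...]}} or None when nothing matches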
""" feature: Feature | None = base_os.features.get("Base OS") if feature is None: return None lowered = [s.lower() for s in substrings] selected = [ pkg for pkg in feature.packages if any(sub in pkg.package.lower() for sub in lowered) ] if not selected: logger.info("No %s packages found in Base OS for substrings %s", name, list(substrings)) return None cluster = [_package_to_dict(pkg) for pkg in selected] logger.info("Built %s config with %d package(s)", name, len(cluster)) return {name: {"cluster": cluster}} def build_nfs_config(base_os: FeatureList) -> Dict | None: """Build nfs config from Base OS FeatureList.""" return _build_subconfig_from_base_os(base_os, "nfs", ["nfs"]) def build_openldap_config(base_os: FeatureList) -> Dict | None: """Build openldap config from Base OS FeatureList.""" return _build_subconfig_from_base_os(base_os, "openldap", ["ldap"]) def build_openmpi_config(base_os: FeatureList) -> Dict | None: """Build openmpi config from Base OS FeatureList.""" return _build_subconfig_from_base_os(base_os, "openmpi", ["openmpi"]) # -------------------------- K8s services from functional layer -------------------------- def build_service_k8s_config(functional: FeatureList) -> Dict: """Build service_k8s.json-like structure from functional FeatureList. Uses feature names "K8S Controller" and "K8S Worker" if present. Common packages (intersection) go into service_k8s; they are removed from the controller/worker clusters. """ controller: Feature | None = functional.features.get("K8S Controller") worker: Feature | None = functional.features.get("K8S Worker") if controller is None or worker is None: raise ValueError("K8S Controller or K8S Worker feature not found in functional layer") ctrl_pkgs = controller.packages node_pkgs = worker.packages ctrl_keys = {_package_key(p) for p in ctrl_pkgs} node_keys = {_package_key(p) for p in node_pkgs} common_keys = ctrl_keys & node_keys def _filter(pkgs: List[Package], exclude: set[Tuple[str, str, str]]) -> List[Package]: return [p for p in pkgs if _package_key(p) not in exclude] # Keep order, but only one instance of each common key seen_common: set[Tuple[str, str, str]] = set() common_pkgs: List[Package] = [] for pkg in ctrl_pkgs + node_pkgs: k = _package_key(pkg) if k in common_keys and k not in seen_common: seen_common.add(k) common_pkgs.append(pkg) logger.info( "Built service_k8s config: %d controller pkg(s), %d worker pkg(s), %d common pkg(s)", len(ctrl_pkgs), len(node_pkgs), len(common_pkgs), ) return { "service_kube_control_plane": { "cluster": [_package_to_dict(p) for p in _filter(ctrl_pkgs, common_keys)] }, "service_kube_node": { "cluster": [_package_to_dict(p) for p in _filter(node_pkgs, common_keys)] }, "service_k8s": {"cluster": [_package_to_dict(p) for p in common_pkgs]}, } # -------------------------- Slurm custom from functional layer -------------------------- def build_slurm_custom_config(functional: FeatureList) -> Dict: """Build slurm_custom.json-style structure from functional FeatureList. Nodes used: - "Login Node" - "Compiler" - "Slurm Controller" - "Slurm Worker" Common packages are those that appear in any 2 or more of these nodes. They are removed from the individual node clusters and placed into slurm_custom. 
""" login = functional.features.get("Login Node") compiler = functional.features.get("Compiler") slurm_ctrl = functional.features.get("Slurm Controller") slurm_worker = functional.features.get("Slurm Worker") if not all([login, compiler, slurm_ctrl, slurm_worker]): raise ValueError("One or more required Slurm-related features not found in functional layer") node_features: Dict[str, Feature] = { "login_node": login, "login_compiler_node": compiler, "slurm_control_node": slurm_ctrl, "slurm_node": slurm_worker, } # Count how many nodes each package appears in key_counts: Counter[Tuple[str, str, str]] = Counter() key_to_pkg: Dict[Tuple[str, str, str], Package] = {} for feature in node_features.values(): seen_in_this_node: set[Tuple[str, str, str]] = set() for pkg in feature.packages: k = _package_key(pkg) key_to_pkg.setdefault(k, pkg) if k not in seen_in_this_node: seen_in_this_node.add(k) key_counts[k] += 1 common_keys = {k for k, count in key_counts.items() if count >= 2} # Build node clusters without common packages output: Dict[str, Dict] = {} for node_name, feature in node_features.items(): filtered_pkgs = [ _package_to_dict(pkg) for pkg in feature.packages if _package_key(pkg) not in common_keys ] output[node_name] = {"cluster": filtered_pkgs} # Build slurm_custom cluster from common packages (dedup, keep deterministic order) common_pkg_dicts: List[Dict[str, str]] = [] for k, pkg in key_to_pkg.items(): if k in common_keys: common_pkg_dicts.append(_package_to_dict(pkg)) output["slurm_custom"] = {"cluster": common_pkg_dicts} logger.info( "Built slurm_custom config with %d node cluster(s) and %d common package(s)", len(node_features), len(common_pkg_dicts), ) return output # -------------------------- Infrastructure splitting -------------------------- def build_infra_configs(infra: FeatureList) -> Dict[str, Dict]: """Split infrastructure FeatureList into separate config-style JSON structures. Returns a mapping of filename -> JSON dict. Filenames and top-level keys are derived from the feature names, with a special case for CSI to match the existing csi_driver_powerscale.json pattern. """ configs: Dict[str, Dict] = {} for feature_name, feature in infra.features.items(): name_snake = _snake_case(feature_name) if feature_name.lower() == "csi": file_name = "csi_driver_powerscale.json" top_key = "csi_driver_powerscale" else: file_name = f"{name_snake}.json" top_key = name_snake cluster = [_package_to_dict(pkg) for pkg in feature.packages] configs[file_name] = {top_key: {"cluster": cluster}} logger.info("Built %d infrastructure config file(s)", len(configs)) return configs # -------------------------- Utility: write configs to disk -------------------------- def write_config_files(configs: Dict[str, Dict], output_dir: str) -> None: """Write multiple config JSONs into an output directory. - configs: mapping of filename -> JSON-serializable dict - output_dir: directory under which files will be written """ os.makedirs(output_dir, exist_ok=True) logger.info("Writing %d config file(s) to %s", len(configs), output_dir) for filename, data in configs.items(): path = os.path.join(output_dir, filename) logger.debug("Writing config file %s", path) with open(path, "w", encoding="utf-8") as out_file: # Expect shape: { top_key: { "cluster": [pkg_dicts...] 
} } out_file.write("{\n") items = list(data.items()) for i, (top_key, body) in enumerate(items): out_file.write(f" {json.dumps(top_key)}: {{\n") out_file.write(" \"cluster\": [\n") pkgs = body.get("cluster", []) for j, pkg in enumerate(pkgs): line = " " + json.dumps(pkg, separators=(", ", ": ")) if j < len(pkgs) - 1: line += "," out_file.write(line + "\n") out_file.write(" ]\n") out_file.write(" }") if i < len(items) - 1: out_file.write(",\n") else: out_file.write("\n") out_file.write("}\n") def generate_all_configs( functional: FeatureList, infra: FeatureList, base_os: FeatureList, misc: FeatureList, catalog: Catalog, output_root: str, ) -> None: """Driver that builds and writes all config-style JSONs. For each (arch, os_name, version) combination present in the Catalog's FunctionalPackages/OSPackages, this writes a full set of config-style JSONs under: output_root/// Files written (if data available): - default_packages.json - nfs.json - openldap.json - openmpi.json - service_k8s.json - slurm_custom.json - one file per infrastructure feature (e.g. csi_driver_powerscale.json) """ combos = _discover_arch_os_version_from_catalog(catalog) logger.info("Generating adapter configs for %d combination(s)", len(combos)) for arch, os_name, version in combos: functional_arch = _filter_featurelist_for_arch(functional, arch) base_os_arch = _filter_featurelist_for_arch(base_os, arch) infra_arch = _filter_featurelist_for_arch(infra, arch) misc_arch = _filter_featurelist_for_arch(misc, arch) logger.info( "Building configs for arch=%s os=%s version=%s", arch, os_name, version ) configs: Dict[str, Dict] = {} configs["default_packages.json"] = build_default_packages_config(base_os_arch) for filename, builder in ( ("nfs.json", build_nfs_config), ("openldap.json", build_openldap_config), ("openmpi.json", build_openmpi_config), ): cfg = builder(base_os_arch) if cfg: configs[filename] = cfg configs["service_k8s.json"] = build_service_k8s_config(functional_arch) configs["slurm_custom.json"] = build_slurm_custom_config(functional_arch) misc_feature: Feature | None = misc_arch.features.get("Miscellaneous") if misc_feature is not None and misc_feature.packages: configs["miscellaneous.json"] = { "miscellaneous": { "cluster": [_package_to_dict(p) for p in misc_feature.packages] } } infra_configs = build_infra_configs(infra_arch) configs.update(infra_configs) output_dir = os.path.join(output_root, arch, os_name, version) write_config_files(configs, output_dir) def generate_omnia_json_from_catalog( catalog_path: str, schema_path: str = _DEFAULT_SCHEMA_PATH, output_root: str = "out/adapter/input/config", *, log_file: Optional[str] = None, configure_logging: bool = False, log_level: int = logging.INFO, ) -> None: """Generate adapter configuration JSONs for a catalog file. - If configure_logging is True, logging is configured using _configure_logging, optionally writing to log_file. - On missing files, FileNotFoundError is raised after logging an error. - No sys.exit is called; callers are expected to handle exceptions. 
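    Example (illustrative paths):
        generate_omnia_json_from_catalog(
            catalog_path="catalog.json",
            output_root="out/adapter/input/config",
            configure_logging=True,
        )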
""" if configure_logging: _configure_logging(log_file=log_file, log_level=log_level) _validate_catalog_and_schema_paths(catalog_path, schema_path) catalog = ParseCatalog(catalog_path, schema_path) functional_layer_json = generate_functional_layer_json(catalog) infrastructure_json = generate_infrastructure_json(catalog) base_os_json = generate_base_os_json(catalog) miscellaneous_json = generate_miscellaneous_json(catalog) generate_all_configs( functional=functional_layer_json, infra=infrastructure_json, base_os=base_os_json, misc=miscellaneous_json, catalog=catalog, output_root=output_root, ) if __name__ == "__main__": parser = argparse.ArgumentParser(description='Generate adapter configs') parser.add_argument('--catalog', required=True, help='Path to input catalog JSON file') parser.add_argument('--schema', required=False, default=_DEFAULT_SCHEMA_PATH, help='Path to catalog schema JSON file') parser.add_argument('--log-file', required=False, default=None, help='Path to log file; if not set, logs go to stderr') args = parser.parse_args() _configure_logging(log_file=args.log_file, log_level=logging.INFO) logger.info("Adapter config generation started for %s", args.catalog) try: generate_omnia_json_from_catalog( catalog_path=args.catalog, schema_path=args.schema, output_root="out/adapter/input/config", ) logger.info("Adapter config generation completed for %s", args.catalog) except FileNotFoundError: logger.error("File not found during processing") sys.exit(ERROR_CODE_INPUT_NOT_FOUND) except ValidationError: sys.exit(ERROR_CODE_PROCESSING_ERROR) except Exception: logger.exception("Unexpected error while generating adapter configs") sys.exit(ERROR_CODE_PROCESSING_ERROR) ================================================ FILE: build_stream/core/catalog/adapter_policy.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Adapter to generate Omnia input JSONs from policy. Transforms root JSONs from the main directory into target adapter config JSONs using a declarative adapter policy file. """ import json import os import argparse import logging import shutil from typing import Dict, List, Any, Optional, Tuple from collections import Counter import yaml from jsonschema import ValidationError, validate from .utils import _configure_logging, load_json_file from . 
import adapter_policy_schema_consts as schema logger = logging.getLogger(__name__) _BASE_DIR = os.path.dirname(__file__) _DEFAULT_POLICY_PATH = os.path.join(_BASE_DIR, "resources", "adapter_policy_default.json") _DEFAULT_SCHEMA_PATH = os.path.join(_BASE_DIR, "resources", "AdapterPolicySchema.json") _K8S_VERSION = "1.34.1" _CSI_VERSION = "v2.15.0" def _validate_input_policy_and_schema_paths( input_dir: str, policy_path: str, schema_path: str, ) -> None: if not os.path.isdir(input_dir): logger.error("Input directory not found: %s", input_dir) raise FileNotFoundError(input_dir) if not os.path.isfile(policy_path): logger.error("Adapter policy file not found: %s", policy_path) raise FileNotFoundError(policy_path) if not os.path.isfile(schema_path): logger.error("Adapter policy schema file not found: %s", schema_path) raise FileNotFoundError(schema_path) def validate_policy_config(policy_config: Any, schema_config: Any, policy_path: str, schema_path: str) -> None: """Validate the adapter policy JSON against the schema.""" try: validate(instance=policy_config, schema=schema_config) except ValidationError as exc: loc = "/".join(str(p) for p in exc.absolute_path) if exc.absolute_path else "" raise ValueError( "Adapter policy validation failed.\n" f"Policy: {policy_path}\n" f"Schema: {schema_path}\n" f"At: {loc}\n" f"Error: {exc.message}" ) from exc def discover_architectures(input_dir: str) -> List[str]: """Discover available architectures from input directory structure.""" archs = [] if os.path.isdir(input_dir): for item in os.listdir(input_dir): item_path = os.path.join(input_dir, item) if os.path.isdir(item_path): archs.append(item) return archs def discover_os_versions(input_dir: str, arch: str) -> List[Tuple[str, str]]: """Discover OS families and versions for a given architecture. Returns list of (os_family, version) tuples. """ results = [] arch_path = os.path.join(input_dir, arch) if not os.path.isdir(arch_path): return results for os_family in os.listdir(arch_path): os_family_path = os.path.join(arch_path, os_family) if os.path.isdir(os_family_path): for version in os.listdir(os_family_path): version_path = os.path.join(os_family_path, version) if os.path.isdir(version_path): results.append((os_family, version)) return results def _has_non_empty_cluster(target_data: Dict) -> bool: """Return True if any subgroup in target_data has a non-empty cluster list.""" for subgroup_body in target_data.values(): if subgroup_body.get(schema.CLUSTER): return True return False def _collect_non_empty_subgroups( target_name: str, target_data: Dict, ) -> List[str]: """Return subgroup names that have non-empty cluster and differ from target_name.""" return [ key for key, body in target_data.items() if key != target_name and body.get(schema.CLUSTER) ] def _extract_version_from_target_config( target_name: str, target_data: Dict[str, Dict] ) -> Optional[str]: """Extract version from target config package. 
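    For example (illustrative values only), if target_data["openmpi"]["cluster"]
    contains {"package": "openmpi", "version": "4.1.6"}, the function returns
    "4.1.6"; if no cluster entry's "package" matches target_name, None is returned.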
Args: target_name: Name of the target (e.g., "ucx", "openmpi") target_data: Target configuration data Returns: Version string if found, None otherwise """ if target_name not in target_data: return None # Get the cluster packages for this target cluster_data = target_data[target_name].get(schema.CLUSTER, []) if not cluster_data: return None # Find the main package (same name as target) for pkg in cluster_data: if pkg.get("package") == target_name: return pkg.get("version") return None def generate_software_config( output_dir: str, os_family: str, os_version: str, all_arch_target_configs: Dict[str, Dict[str, Dict]], ) -> None: """Generate software_config.json from collected target configs. Args: output_dir: Root output directory (file written to output_dir/input/software_config.json). os_family: OS family string (e.g. "rhel"). os_version: OS version string (e.g. "10.0"). all_arch_target_configs: Mapping of arch -> {target_file -> {subgroup -> {cluster: [...]}}}. """ # Discover all target files across architectures all_target_files: set = set() for arch_targets in all_arch_target_configs.values(): all_target_files.update(arch_targets.keys()) softwares: List[Dict] = [] subgroup_sections: Dict[str, List[Dict]] = {} for target_file in sorted(all_target_files): target_name = target_file.removesuffix(".json") # Determine which arches have non-empty content for this target supported_arches: List[str] = [] for arch in sorted(all_arch_target_configs.keys()): target_data = all_arch_target_configs[arch].get(target_file) if target_data and _has_non_empty_cluster(target_data): supported_arches.append(arch) if not supported_arches: continue entry: Dict[str, Any] = {"name": target_name} if "service_k8" in target_name: entry["version"] = _K8S_VERSION elif "csi" in target_name: entry["version"] = _CSI_VERSION elif target_name in ("ucx", "openmpi"): # Extract version from target config for UCX and OpenMPI version = None for arch in ("x86_64", "aarch64"): arch_configs = all_arch_target_configs.get(arch, {}) target_data = arch_configs.get(target_file) if target_data: version = _extract_version_from_target_config(target_name, target_data) if version: break if version: entry["version"] = version entry["arch"] = supported_arches softwares.append(entry) # Collect subgroups (union across arches, non-empty only, exclude target name) merged_subgroups: set = set() for arch in all_arch_target_configs: target_data = all_arch_target_configs[arch].get(target_file) if target_data: merged_subgroups.update( _collect_non_empty_subgroups(target_name, target_data) ) if merged_subgroups: subgroup_sections[target_name] = [ {"name": sg} for sg in sorted(merged_subgroups) ] config: Dict[str, Any] = { "cluster_os_type": os_family, "cluster_os_version": os_version, "repo_config": "always", "softwares": softwares, } config.update(subgroup_sections) input_dir = os.path.join(output_dir, "input") os.makedirs(input_dir, exist_ok=True) output_path = os.path.join(input_dir, "software_config.json") # Write with compact single-line arrays to match expected format with open(output_path, "w", encoding="utf-8") as f: f.write("{\n") # Write top-level fields f.write(f' "cluster_os_type": "{config["cluster_os_type"]}",\n') f.write(f' "cluster_os_version": "{config["cluster_os_version"]}",\n') f.write(f' "repo_config": "{config["repo_config"]}",\n') # Write softwares array (compact format) f.write(' "softwares": [\n') softwares = config["softwares"] for i, sw in enumerate(softwares): line = " " + json.dumps(sw, separators=(",", ": ")) if i < 
len(softwares) - 1: line += "," f.write(line + "\n") f.write(' ]') # Write subgroup sections (compact format) subgroup_keys = [k for k in config.keys() if k not in ("cluster_os_type", "cluster_os_version", "repo_config", "softwares")] for key in subgroup_keys: f.write(',\n') f.write(f' "{key}": [\n') items = config[key] for i, item in enumerate(items): line = " " + json.dumps(item, separators=(",", ": ")) if i < len(items) - 1: line += "," f.write(line + "\n") f.write(' ]') f.write("\n\n}\n") logger.info("Generated software_config.json at: %s", output_path) def _package_key(pkg: Dict) -> Tuple[str, str, str]: """Generate a stable key for a package. For v2 derived operations (common package extraction), we want equivalence based on the full package definition except architecture. This avoids collisions for tarballs where repo_name is absent and uri differs. """ def _hashable(v: Any) -> Any: if isinstance(v, (dict, list)): return json.dumps(v, sort_keys=True) return v return tuple( sorted( (k, _hashable(v)) for k, v in pkg.items() if k != "architecture" ) ) def transform_package(pkg: Dict, transform_config: Optional[Dict]) -> Dict: """Apply transformation rules to a package dict (excluding filter).""" if not transform_config: return pkg.copy() result = pkg.copy() # Auto-exclude versions for non-git packages, except UCX and OpenMPI package_type = result.get("type") package_name = result.get("package") if package_type != "git" and package_name not in ("ucx", "openmpi"): result.pop("version", None) exclude_fields = transform_config.get(schema.EXCLUDE_FIELDS, []) for field in exclude_fields: result.pop(field, None) rename_fields = transform_config.get(schema.RENAME_FIELDS, {}) for old_name, new_name in rename_fields.items(): if old_name in result: result[new_name] = result.pop(old_name) return result def apply_substring_filter( packages: List[Dict], filter_config: Dict ) -> List[Dict]: """Filter packages by substring matching on a specified field.""" field = filter_config.get(schema.FIELD, "package") values = filter_config.get(schema.VALUES, []) case_sensitive = filter_config.get(schema.CASE_SENSITIVE, False) if not values: return packages filtered = [] for pkg in packages: field_value = pkg.get(field, "") if not case_sensitive: field_value = field_value.lower() check_values = [v.lower() for v in values] else: check_values = values if any(v in field_value for v in check_values): filtered.append(pkg) return filtered def apply_allowlist_filter( packages: List[Dict], filter_config: Dict, ) -> List[Dict]: field = filter_config.get(schema.FIELD, "package") values = filter_config.get(schema.VALUES, []) case_sensitive = filter_config.get(schema.CASE_SENSITIVE, False) if not values: return packages if not case_sensitive: allowed = {str(v).lower() for v in values} else: allowed = {str(v) for v in values} result: List[Dict] = [] for pkg in packages: field_value = pkg.get(field) if field_value is None: continue s = str(field_value) if not case_sensitive: s = s.lower() if s in allowed: result.append(pkg) return result def apply_field_in_filter( packages: List[Dict], filter_config: Dict, ) -> List[Dict]: field = filter_config.get(schema.FIELD) values = filter_config.get(schema.VALUES, []) case_sensitive = filter_config.get(schema.CASE_SENSITIVE, False) if not field or not values: return packages if not case_sensitive: allowed = {str(v).lower() for v in values} else: allowed = {str(v) for v in values} result: List[Dict] = [] for pkg in packages: field_value = pkg.get(field) if field_value is None: continue if 
isinstance(field_value, list): vals = [str(v) for v in field_value] if not case_sensitive: vals = [v.lower() for v in vals] if any(v in allowed for v in vals): result.append(pkg) else: s = str(field_value) if not case_sensitive: s = s.lower() if s in allowed: result.append(pkg) return result def apply_any_of_filter( packages: List[Dict], source_data: Dict, source_key: str, filter_config: Dict, ) -> List[Dict]: filters = filter_config.get(schema.FILTERS, []) if not filters: return packages result: List[Dict] = [] for pkg in packages: for sub_filter in filters: filtered = apply_filter([pkg], source_data, source_key, sub_filter) if filtered: result.append(pkg) break return result def compute_common_packages( source_data: Dict, compare_keys: List[str], min_occurrences: int = 2 ) -> Tuple[set, Dict[Tuple, Dict]]: """Compute packages that appear in multiple source keys. Returns: - Set of common package keys - Dict mapping package key to package dict """ key_counts: Counter = Counter() key_to_pkg: Dict[Tuple, Dict] = {} for source_key in compare_keys: if source_key not in source_data: continue feature = source_data[source_key] packages = feature.get(schema.PACKAGES, []) seen_in_this_key: set = set() for pkg in packages: k = _package_key(pkg) key_to_pkg.setdefault(k, pkg) if k not in seen_in_this_key: seen_in_this_key.add(k) key_counts[k] += 1 common_keys = {k for k, count in key_counts.items() if count >= min_occurrences} return common_keys, key_to_pkg def apply_extract_common_filter( packages: List[Dict], source_data: Dict, filter_config: Dict ) -> List[Dict]: """Extract packages that are common across multiple source keys.""" compare_keys = filter_config.get(schema.COMPARE_KEYS, []) min_occurrences = filter_config.get(schema.MIN_OCCURRENCES, 2) if not compare_keys: return packages common_keys, key_to_pkg = compute_common_packages(source_data, compare_keys, min_occurrences) # Return common packages in deterministic order result = [] seen = set() for k, pkg in key_to_pkg.items(): if k in common_keys and k not in seen: seen.add(k) result.append(pkg) return result def apply_extract_unique_filter( packages: List[Dict], source_data: Dict, _source_key: str, filter_config: Dict ) -> List[Dict]: """Extract packages unique to the current source key (not common with others).""" compare_keys = filter_config.get(schema.COMPARE_KEYS, []) min_occurrences = filter_config.get(schema.MIN_OCCURRENCES, 2) if not compare_keys: return packages common_keys, _ = compute_common_packages(source_data, compare_keys, min_occurrences) # Return packages from current source_key that are NOT in common return [pkg for pkg in packages if _package_key(pkg) not in common_keys] def apply_filter( packages: List[Dict], _source_data: Dict, _source_key: str, filter_config: Optional[Dict] ) -> List[Dict]: """Apply filter based on filter type.""" if not filter_config: return packages filter_type = filter_config.get(schema.TYPE) if filter_type == schema.SUBSTRING_FILTER: return apply_substring_filter(packages, filter_config) if filter_type == schema.ALLOWLIST_FILTER: return apply_allowlist_filter(packages, filter_config) if filter_type == schema.FIELD_IN_FILTER: return apply_field_in_filter(packages, filter_config) if filter_type == schema.ANY_OF_FILTER: return apply_any_of_filter(packages, _source_data, _source_key, filter_config) logger.warning("Unknown/unsupported filter type in v2: %s", filter_type) return packages def merge_transform(base: Optional[Dict], override: Optional[Dict]) -> Optional[Dict]: """Merge two transform dicts where 
override wins.""" if not base and not override: return None if not base: return override if not override: return base merged = base.copy() merged.update(override) return merged def compute_common_keys_from_roles( roles: Dict[str, List[Dict]], from_keys: List[str], min_occurrences: int ) -> set: """Compute package keys that are common across the given target roles.""" key_counts: Counter = Counter() for role_key in from_keys: pkgs = roles.get(role_key, []) seen_in_role: set = set() for pkg in pkgs: k = _package_key(pkg) if k not in seen_in_role: seen_in_role.add(k) key_counts[k] += 1 return {k for k, count in key_counts.items() if count >= min_occurrences} def derive_common_role( target_roles: Dict[str, List[Dict]], derived_key: str, from_keys: List[str], min_occurrences: int = 2, remove_from_sources: bool = True ) -> None: """Derive a common role and optionally remove common packages from source roles.""" common_keys = compute_common_keys_from_roles(target_roles, from_keys, min_occurrences) common_pkgs: List[Dict] = [] seen: set = set() for role_key in from_keys: for pkg in target_roles.get(role_key, []): k = _package_key(pkg) if k in common_keys and k not in seen: seen.add(k) common_pkgs.append(pkg) target_roles[derived_key] = common_pkgs if remove_from_sources: for role_key in from_keys: target_roles[role_key] = [ pkg for pkg in target_roles.get(role_key, []) if _package_key(pkg) not in common_keys ] def check_conditions( conditions: Optional[Dict], arch: str, os_family: str, os_version: str ) -> bool: """Check if mapping conditions are satisfied.""" if not conditions: return True if schema.ARCHITECTURES in conditions: if arch not in conditions[schema.ARCHITECTURES]: return False if schema.OS_FAMILIES in conditions: if os_family not in conditions[schema.OS_FAMILIES]: return False if schema.OS_VERSIONS in conditions: if os_version not in conditions[schema.OS_VERSIONS]: return False return True def process_target_spec( target_file: str, target_spec: Dict, source_files: Dict[str, Dict], target_configs: Dict[str, Dict], arch: str, os_family: str, os_version: str ) -> None: """Build a single target file config using v2 target-centric spec.""" conditions = target_spec.get(schema.CONDITIONS) if not check_conditions(conditions, arch, os_family, os_version): logger.debug("Skipping target %s (conditions not met)", target_file) return target_level_transform = target_spec.get(schema.TRANSFORM) target_roles: Dict[str, List[Dict]] = {} for source_spec in target_spec.get(schema.SOURCES, []): source_file = source_spec.get(schema.SOURCE_FILE) if not source_file or source_file not in source_files: logger.debug("Source file %s not loaded/available", source_file) continue source_data = source_files[source_file] for pull in source_spec.get(schema.PULLS, []): source_key = pull.get(schema.SOURCE_KEY) if not source_key or source_key not in source_data: logger.debug("Source key '%s' not found in %s", source_key, source_file) continue target_key = pull.get(schema.TARGET_KEY) or source_key filter_config = pull.get(schema.FILTER) pull_transform = merge_transform(target_level_transform, pull.get(schema.TRANSFORM)) packages = source_data[source_key].get(schema.PACKAGES, []) packages = apply_filter(packages, source_data, source_key, filter_config) packages = [transform_package(pkg, pull_transform) for pkg in packages] if target_key in target_roles: target_roles[target_key].extend(packages) else: target_roles[target_key] = packages for derived in target_spec.get(schema.DERIVED, []) or []: derived_key = 
derived.get(schema.TARGET_KEY) operation = derived.get(schema.OPERATION, {}) op_type = operation.get(schema.TYPE) if op_type != schema.EXTRACT_COMMON_OPERATION: logger.warning("Unsupported derived operation type: %s", op_type) continue from_keys = operation.get(schema.FROM_KEYS, []) min_occurrences = operation.get(schema.MIN_OCCURRENCES, 2) remove_from_sources = operation.get(schema.REMOVE_FROM_SOURCES, True) if derived_key and from_keys: derive_common_role( target_roles=target_roles, derived_key=derived_key, from_keys=from_keys, min_occurrences=min_occurrences, remove_from_sources=remove_from_sources ) if target_roles: # Special validation for UCX and OpenMPI targets target_file_name = os.path.basename(target_file).replace('.json', '') # Check if we should generate this target should_generate = True if target_file_name in ['ucx', 'openmpi']: # Check if main package exists for these specific targets main_package_found = False for target_key, packages in target_roles.items(): package_names = [pkg.get("package") for pkg in packages] if target_file_name in package_names: main_package_found = True break # Skip generation only for UCX/OpenMPI if main package missing if not main_package_found: logger.debug("Skipping %s: main package '%s' not found", target_file, target_file_name) should_generate = False # Generate target config only if validation passes if should_generate: target_configs[target_file] = { role_key: {schema.CLUSTER: pkgs} for role_key, pkgs in target_roles.items() } def write_config_file(file_path: str, config: Dict) -> None: """Write a config JSON file with proper formatting.""" os.makedirs(os.path.dirname(file_path), exist_ok=True) with open(file_path, "w", encoding="utf-8") as out_file: out_file.write("{\n") items = list(config.items()) for i, (top_key, body) in enumerate(items): out_file.write(f' "{top_key}": {{\n') out_file.write(f' "{schema.CLUSTER}": [\n') pkgs = body.get(schema.CLUSTER, []) for j, pkg in enumerate(pkgs): line = " " + json.dumps(pkg, separators=(", ", ": ")) if j < len(pkgs) - 1: line += "," out_file.write(line + "\n") out_file.write(" ]\n") out_file.write(" }") if i < len(items) - 1: out_file.write(",\n") else: out_file.write("\n") out_file.write("}\n") def generate_configs_from_policy( input_dir: str, output_dir: str, policy_path: str = _DEFAULT_POLICY_PATH, schema_path: str = _DEFAULT_SCHEMA_PATH, *, log_file: Optional[str] = None, configure_logging: bool = False, log_level: int = logging.INFO, ) -> None: """Main function to generate adapter configs using adapter policy. 
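    Example (illustrative paths only, not a fixed layout):

        generate_configs_from_policy(
            input_dir="out/main",
            output_dir="out/adapter",
            configure_logging=True,
        )

    reads source JSONs from out/main/<arch>/<os_family>/<version>/, writes the
    generated target configs under out/adapter/input/config/<arch>/<os_family>/<version>/,
    and writes software_config.json under out/adapter/input/.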
Args: input_dir: Path to input directory (e.g., poc/milestone-1/out1/main) output_dir: Path to output directory (e.g., poc/milestone-1/out1/adapter/input/config) policy_path: Path to adapter policy JSON file schema_path: Path to adapter policy schema JSON file software_config_path: Optional path to software_config.json to copy to output log_file: Optional path to log file configure_logging: Whether to configure logging log_level: Logging level """ if configure_logging: _configure_logging(log_file=log_file, log_level=log_level) _validate_input_policy_and_schema_paths(input_dir, policy_path, schema_path) policy_config = load_json_file(policy_path) schema_config = load_json_file(schema_path) validate_policy_config(policy_config, schema_config, policy_path=policy_path, schema_path=schema_path) targets = policy_config.get(schema.TARGETS, {}) logger.info("Loaded %d target(s) from %s", len(targets), policy_path) # Discover architectures architectures = discover_architectures(input_dir) if not architectures: logger.warning("No architectures discovered under input directory: %s", input_dir) return logger.info("Discovered architectures: %s", architectures) all_arch_target_configs: Dict[str, Dict[str, Dict]] = {} resolved_os_family: Optional[str] = None resolved_os_version: Optional[str] = None for arch in architectures: os_versions = discover_os_versions(input_dir, arch) for os_family, version in os_versions: logger.info("Processing: arch=%s, os=%s, version=%s", arch, os_family, version) if resolved_os_family is None: resolved_os_family = os_family resolved_os_version = version source_dir = os.path.join(input_dir, arch, os_family, version) target_dir = os.path.join(output_dir, "input", "config", arch, os_family, version) if not os.path.isdir(source_dir): logger.warning("Source directory not found, skipping: %s", source_dir) continue source_files: Dict[str, Dict] = {} for filename in os.listdir(source_dir): if filename.endswith(".json"): file_path = os.path.join(source_dir, filename) source_files[filename] = load_json_file(file_path) logger.debug("Loaded source file: %s", filename) target_configs: Dict[str, Dict] = {} for target_file, target_spec in targets.items(): process_target_spec( target_file=target_file, target_spec=target_spec, source_files=source_files, target_configs=target_configs, arch=arch, os_family=os_family, os_version=version ) for target_file, data in target_configs.items(): if data: file_path = os.path.join(target_dir, target_file) write_config_file(file_path, data) logger.info("Written: %s", file_path) all_arch_target_configs[arch] = target_configs generate_software_config( output_dir=output_dir, os_family=resolved_os_family or "", os_version=resolved_os_version or "", all_arch_target_configs=all_arch_target_configs, ) def main(): """CLI entry point.""" parser = argparse.ArgumentParser( description="Generate adapter configs from input JSONs using adapter policy" ) parser.add_argument( "--input-dir", required=True, help="Path to input directory containing source JSONs (e.g., out1/main)" ) parser.add_argument( "--output-dir", required=True, help="Path to output directory for generated configs (e.g., out1/adapter/input/config)" ) parser.add_argument( "--policy", default=_DEFAULT_POLICY_PATH, help="Path to adapter policy JSON file" ) parser.add_argument( "--schema", default=_DEFAULT_SCHEMA_PATH, help="Path to adapter policy schema JSON file" ) parser.add_argument( "--log-file", required=False, default=None, help="Path to log file; if not set, logs go to stderr" ) parser.add_argument( 
"--log-level", default="INFO", choices=["DEBUG", "INFO", "WARNING", "ERROR"], help="Logging level" ) args = parser.parse_args() _configure_logging( log_file=args.log_file, log_level=getattr(logging, args.log_level), ) logger.info("Starting adapter policy generation") logger.info("Input directory: %s", args.input_dir) logger.info("Output directory: %s", args.output_dir) logger.info("Policy file: %s", args.policy) generate_configs_from_policy( input_dir=args.input_dir, output_dir=args.output_dir, policy_path=args.policy, schema_path=args.schema, configure_logging=False, ) logger.info("Adapter config generation completed") if __name__ == "__main__": main() ================================================ FILE: build_stream/core/catalog/adapter_policy_schema_consts.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """String constants for adapter policy schema keys.""" TARGETS = "targets" SOURCES = "sources" SOURCE_FILE = "source_file" PULLS = "pulls" SOURCE_KEY = "source_key" TARGET_KEY = "target_key" FILTER = "filter" TRANSFORM = "transform" CONDITIONS = "conditions" DERIVED = "derived" OPERATION = "operation" FROM_KEYS = "from_keys" MIN_OCCURRENCES = "min_occurrences" REMOVE_FROM_SOURCES = "remove_from_sources" PACKAGES = "packages" TYPE = "type" SUBSTRING_FILTER = "substring" ALLOWLIST_FILTER = "allowlist" FIELD_IN_FILTER = "field_in" ANY_OF_FILTER = "any_of" EXTRACT_COMMON_OPERATION = "extract_common" CLUSTER = "cluster" EXCLUDE_FIELDS = "exclude_fields" RENAME_FIELDS = "rename_fields" FIELD = "field" VALUES = "values" CASE_SENSITIVE = "case_sensitive" FILTERS = "filters" COMPARE_KEYS = "compare_keys" ARCHITECTURES = "architectures" OS_FAMILIES = "os_families" OS_VERSIONS = "os_versions" ================================================ FILE: build_stream/core/catalog/exceptions.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
"""Domain exceptions for Catalog operations.""" from typing import Optional class CatalogParseError(Exception): """Base exception for catalog parsing failures.""" def __init__(self, message: str, correlation_id: Optional[str] = None) -> None: super().__init__(message) self.message = message self.correlation_id = correlation_id class InvalidFileFormatError(CatalogParseError): """Uploaded file has an invalid format (not .json).""" class InvalidJSONError(CatalogParseError): """JSON content is malformed or not a dictionary.""" class CatalogSchemaValidationError(CatalogParseError): """Catalog JSON fails schema validation.""" def __init__( self, message: str, schema_path: str = "", correlation_id: Optional[str] = None, ) -> None: super().__init__(message, correlation_id=correlation_id) self.schema_path = schema_path class FileTooLargeError(CatalogParseError): """Uploaded file exceeds the maximum allowed size.""" def __init__( self, actual_size: int, max_size: int, correlation_id: Optional[str] = None, ) -> None: super().__init__( f"File size {actual_size} bytes exceeds maximum {max_size} bytes", correlation_id=correlation_id, ) self.actual_size = actual_size self.max_size = max_size class AdapterPolicyValidationError(CatalogParseError): """Adapter policy fails schema validation.""" def __init__( self, message: str, policy_path: str = "", correlation_id: Optional[str] = None, ) -> None: super().__init__(message, correlation_id=correlation_id) self.policy_path = policy_path class ConfigGenerationError(CatalogParseError): """Omnia config generation fails during adapter transformation.""" ================================================ FILE: build_stream/core/catalog/generator.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Catalog parser generator. Provides programmatic APIs and a CLI to generate feature-list JSON files from a catalog, and to load/validate feature-list JSONs. """ import argparse from dataclasses import dataclass import json import logging import os import sys from typing import Dict, List, Optional, Tuple from jsonschema import ValidationError, validate from .models import Catalog from .parser import ParseCatalog from .utils import _configure_logging, load_json_file logger = logging.getLogger(__name__) _BASE_DIR = os.path.dirname(__file__) _DEFAULT_SCHEMA_PATH = os.path.join(_BASE_DIR, "resources", "CatalogSchema.json") _ROOT_LEVEL_SCHEMA_PATH = os.path.join(_BASE_DIR, "resources", "RootLevelSchema.json") ERROR_CODE_INPUT_NOT_FOUND = 2 ERROR_CODE_PROCESSING_ERROR = 3 # This code generates JSON files # i.e baseos.json, infrastructure.json, functional_layer.json, miscellaneous.json # for a given catalog def _validate_catalog_and_schema_paths(catalog_path: str, schema_path: str) -> None: """Validate that the catalog and schema paths exist. Raises FileNotFoundError if either path does not exist. 
""" if not os.path.isfile(catalog_path): logger.error("Catalog file not found: %s", catalog_path) raise FileNotFoundError(catalog_path) if not os.path.isfile(schema_path): logger.error("Schema file not found: %s", schema_path) raise FileNotFoundError(schema_path) def _arch_suffix(architecture) -> str: """Return a single-arch suffix from a catalog Package.architecture field. Handles both legacy string values and new List[str] values. """ if isinstance(architecture, list): if not architecture: return "" arch = architecture[0] else: arch = architecture return str(arch) @dataclass class Package: """Represents a package entry inside a generated FeatureList JSON.""" package: str version: Optional[str] type: str repo_name: str architecture: List[str] uri: Optional[str] = None tag: Optional[str] = None sources: Optional[List[dict]] = None @dataclass class Feature: """Represents a single feature/role entry containing a list of packages.""" feature_name: str packages: List[Package] @dataclass class FeatureList: """Collection of features keyed by feature/role name.""" features: Dict[str, Feature] def _filter_featurelist_for_arch(feature_list: FeatureList, arch: str) -> FeatureList: """Return a FeatureList containing only packages for the given arch. Arch is taken from the Package.architecture list. """ filtered_features: Dict[str, Feature] = {} for name, feature in feature_list.features.items(): narrowed_pkgs: List[Package] = [] for p in feature.packages: if arch in getattr(p, "architecture", []): # Derive repo_name and uri from the catalog Sources metadata, if # present, for this specific architecture. repo_name = "" uri = getattr(p, "uri", None) if getattr(p, "sources", None): for src in p.sources: if src.get("Architecture") == arch: if "RepoName" in src: repo_name = src["RepoName"] if "Uri" in src: uri = src["Uri"] break narrowed_pkgs.append( Package( package=p.package, version=getattr(p, "version", None), type=p.type, repo_name=repo_name, architecture=[arch], uri=uri, tag=p.tag, sources=p.sources, ) ) filtered_features[name] = Feature(feature_name=name, packages=narrowed_pkgs) return FeatureList(features=filtered_features) def _discover_arch_os_version_from_catalog(catalog: Catalog) -> List[Tuple[str, str, str]]: """Discover distinct (arch, os_name, version) combinations in the Catalog. os_name is returned in lowercase (e.g. "rhel"), version as-is. """ combos: set[Tuple[str, str, str]] = set() def _add_from_packages(packages): for pkg in packages: for os_entry in pkg.supported_os: parts = os_entry.split(" ", 1) if len(parts) == 2: os_name_raw, os_ver = parts else: os_name_raw, os_ver = os_entry, "" os_name = os_name_raw.lower() for arch in pkg.architecture: combos.add((arch, os_name, os_ver)) _add_from_packages(catalog.functional_packages) _add_from_packages(catalog.os_packages) combos_sorted = sorted(combos) logger.debug( "Discovered %d (arch, os, version) combinations in catalog %s", len(combos_sorted), getattr(catalog, "name", ""), ) return combos_sorted def generate_functional_layer_json(catalog: Catalog) -> FeatureList: """ Generates a JSON file containing the functional layer from a given catalog object. Args: - catalog (Catalog): The catalog object to generate the functional layer from. 
Returns: - FeatureList: The generated JSON data """ output_json = FeatureList(features={}) for layer in catalog.functional_layer: feature_json = Feature( feature_name=layer["Name"], packages=[], ) for pkg_id in layer["FunctionalPackages"]: pkg = next((pkg for pkg in catalog.functional_packages if pkg.id == pkg_id), None) if pkg: feature_json.packages.append( Package( package=pkg.name, version=pkg.version, type=pkg.type, repo_name="", architecture=pkg.architecture, uri=None, tag=getattr(pkg, "tag", None), sources=pkg.sources, ) ) output_json.features[feature_json.feature_name] = feature_json return output_json def generate_infrastructure_json(catalog: Catalog) -> FeatureList: """ Generates a JSON file containing the infrastructure from a given catalog object. Args: - catalog (Catalog): The catalog object to generate the infrastructure from. Returns: - FeatureList: The generated JSON data """ output_json = FeatureList(features={}) for infra in catalog.infrastructure: feature_json = Feature( feature_name=infra["Name"], packages=[], ) for pkg_id in infra["InfrastructurePackages"]: pkg = next((pkg for pkg in catalog.infrastructure_packages if pkg.id == pkg_id), None) if pkg: feature_json.packages.append( Package( package=pkg.name, version=pkg.version, type=pkg.type, repo_name="", architecture=pkg.architecture, uri=None, tag=getattr(pkg, "tag", None), sources=pkg.sources, ) ) output_json.features[feature_json.feature_name] = feature_json return output_json def generate_drivers_json(catalog: Catalog) -> FeatureList: """ Generates a JSON file containing the drivers from a given catalog object. Args: - catalog (Catalog): The catalog object to generate the drivers from. Returns: - FeatureList: The generated JSON data """ output_json = FeatureList(features={}) # Map driver package IDs -> Driver objects parsed from DriverPackages. drivers_by_id: Dict[str, any] = {drv.id: drv for drv in catalog.drivers} # If no grouping is present (backward compatibility), fall back to a single # "Drivers" feature containing all drivers. if not getattr(catalog, "drivers_layer", []): feature_json = Feature( feature_name="Drivers", packages=[] ) for driver in catalog.drivers: feature_json.packages.append( Package( package=driver.name, version=driver.version, type=driver.type, repo_name="", architecture=driver.architecture, uri=None, tag=None, sources=None, ) ) output_json.features[feature_json.feature_name] = feature_json return output_json # Respect grouping similar to FunctionalLayer: one Feature per driver group. for group in catalog.drivers_layer: group_name = group.get("Name") driver_ids = group.get("DriverPackages", []) if not group_name or not driver_ids: continue feature_json = Feature( feature_name=group_name, packages=[] ) for driver_id in driver_ids: driver = drivers_by_id.get(driver_id) if not driver: continue feature_json.packages.append( Package( package=driver.name, version=driver.version, type=driver.type, repo_name="", architecture=driver.architecture, uri=None, tag=None, sources=None, ) ) output_json.features[feature_json.feature_name] = feature_json return output_json def generate_base_os_json(catalog: Catalog) -> FeatureList: """ Generates a JSON file containing the base OS from a given catalog object. Args: - catalog (Catalog): The catalog object to generate the base OS from. 
Returns: - FeatureList: The generated JSON data """ output_json = FeatureList(features={}) feature_json = Feature( feature_name="Base OS", packages=[] ) for entry in catalog.base_os: for pkg_id in entry["osPackages"]: pkg = next((pkg for pkg in catalog.os_packages if pkg.id == pkg_id), None) if pkg: feature_json.packages.append( Package( package=pkg.name, version=pkg.version, type=pkg.type, repo_name="", architecture=pkg.architecture, uri=None, tag=getattr(pkg, "tag", None), sources=pkg.sources, ) ) output_json.features[feature_json.feature_name] = feature_json return output_json def generate_miscellaneous_json(catalog: Catalog) -> FeatureList: """Generate a FeatureList for the Miscellaneous group, if present. The catalog is expected to carry a Miscellaneous array of package IDs, referencing FunctionalPackages. This creates a single feature named "Miscellaneous" containing those packages. """ output_json = FeatureList(features={}) feature_json = Feature( feature_name="Miscellaneous", packages=[], ) misc_ids = getattr(catalog, "miscellaneous", []) for pkg_id in misc_ids: pkg = next((pkg for pkg in catalog.functional_packages if pkg.id == pkg_id), None) if not pkg: continue feature_json.packages.append( Package( package=pkg.name, version=pkg.version, type=pkg.type, repo_name="", architecture=pkg.architecture, uri=None, tag=getattr(pkg, "tag", None), sources=pkg.sources, ) ) output_json.features[feature_json.feature_name] = feature_json return output_json def _package_common_dict(pkg: Package) -> Dict: """Common dict representation for a Package (no architecture). Shared between generator and adapter to keep JSON field formatting consistent for package, type, repo_name, uri, and tag. """ data: Dict = {"package": pkg.package, "type": pkg.type} if getattr(pkg, "version", None): data["version"] = pkg.version if getattr(pkg, "repo_name", ""): data["repo_name"] = pkg.repo_name if getattr(pkg, "uri", None) is not None: data["uri"] = pkg.uri if getattr(pkg, "tag", "") and pkg.tag != "": data["tag"] = pkg.tag return data def _package_to_json_dict(pkg: Package) -> Dict: data = _package_common_dict(pkg) data["architecture"] = pkg.architecture return data def _package_from_json_dict(data: Dict) -> Package: return Package( package=data["package"], version=data.get("version"), type=data["type"], repo_name=data.get("repo_name", ""), architecture=data.get("architecture", []), uri=data.get("uri"), tag=data.get("tag"), ) def serialize_json(feature_list: FeatureList, output_path: str): """ Serializes the output JSON data to a file. Args: - feature_list (FeatureList): The feature list data to serialize. - output_path (str): The path to write the serialized JSON file to. 
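    Example of the emitted layout (illustrative package values; spacing is
    approximate):

        {
          "Base OS": {
            "packages": [
              {"package": "curl", "type": "rpm", "architecture": ["x86_64"]},
              {"package": "wget", "type": "rpm", "architecture": ["x86_64"]}
            ]
          }
        }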
""" # Custom pretty-printer so that: # - Overall JSON is nicely indented # - Each package entry inside "packages" is a single-line JSON object logger.info( "Writing FeatureList with %d feature(s) to %s", len(feature_list.features), output_path, ) with open(output_path, "w", encoding="utf-8") as out_file: out_file.write("{\n") items = list(feature_list.features.items()) for i, (feature_name, feature) in enumerate(items): # Feature key out_file.write(f" {json.dumps(feature_name)}: {{\n") out_file.write(" \"packages\": [\n") pkgs = feature.packages for j, pkg in enumerate(pkgs): pkg_dict = _package_to_json_dict(pkg) line = " " + json.dumps(pkg_dict, separators=(", ", ": ")) if j < len(pkgs) - 1: line += "," out_file.write(line + "\n") out_file.write(" ]\n") out_file.write(" }") if i < len(items) - 1: out_file.write(",\n") else: out_file.write("\n") out_file.write("}\n") def deserialize_json(input_path: str) -> FeatureList: """ Deserializes a JSON file to output JSON data. Args: - input_path (str): The path to read the JSON file from. Returns: - FeatureList: The deserialized JSON data """ json_data = load_json_file(input_path) logger.debug("Deserializing FeatureList from %s", input_path) feature_list = FeatureList( features={ feature_name: Feature( feature_name=feature_name, packages=[ _package_from_json_dict(pkg) for pkg in feature_body.get("packages", []) ], ) for feature_name, feature_body in json_data.items() } ) logger.info( "Deserialized FeatureList with %d feature(s) from %s", len(feature_list.features), input_path, ) return feature_list def get_functional_layer_roles_from_file( functional_layer_json_path: str, *, configure_logging: bool = False, log_file: Optional[str] = None, log_level: int = logging.INFO, ) -> List[str]: """Return role names (top-level keys) from a functional_layer.json file. The input JSON is validated against RootLevelSchema.json before it is deserialized. """ if configure_logging: _configure_logging(log_file=log_file, log_level=log_level) logger.info("get_functional_layer_roles_from_file started for %s", functional_layer_json_path) logger.debug("Loading root-level schema from %s", _ROOT_LEVEL_SCHEMA_PATH) schema = load_json_file(_ROOT_LEVEL_SCHEMA_PATH) logger.debug("Validating JSON") json_data = load_json_file(functional_layer_json_path) try: validate(instance=json_data, schema=schema) except ValidationError as exc: logger.error( "JSON validation failed for %s", functional_layer_json_path, ) raise logger.info("JSON validation succeeded") feature_list = deserialize_json(functional_layer_json_path) logger.debug("Populating roles info") roles = list(feature_list.features.keys()) logger.info( "get_functional_layer_roles_from_file completed for %s (roles=%d)", functional_layer_json_path, len(roles), ) return roles def get_package_list( functional_layer_json_path: str, role: Optional[str] = None, *, configure_logging: bool = False, log_file: Optional[str] = None, log_level: int = logging.INFO, ) -> List[Dict]: """Return packages for a specific role or all roles from a functional_layer.json file. The input JSON is validated against RootLevelSchema.json before it is deserialized. Args: functional_layer_json_path: Path to the functional_layer.json file. role: Optional role identifier. If None, returns packages for all roles. configure_logging: If True, configure logging with optional file output. log_file: Path to log file; if not set, logs go to stderr. log_level: Logging level (default: logging.INFO). 
Returns: List of role objects, each containing: - roleName: str - packages: List[Dict] with keys: name, type, repo_name, architecture, uri, tag Raises: FileNotFoundError: If the JSON file does not exist. ValidationError: If the JSON fails schema validation. ValueError: If the specified role does not exist. """ if configure_logging: _configure_logging(log_file=log_file, log_level=log_level) logger.info( "get_package_list started for %s (role=%s)", functional_layer_json_path, role if role else "all", ) logger.debug("Checking if file exists: %s", functional_layer_json_path) if not os.path.isfile(functional_layer_json_path): logger.error("File not found: %s", functional_layer_json_path) raise FileNotFoundError(functional_layer_json_path) logger.debug("Loading root-level schema from %s", _ROOT_LEVEL_SCHEMA_PATH) with open(_ROOT_LEVEL_SCHEMA_PATH, "r", encoding="utf-8") as f: schema = json.load(f) logger.debug("Loading and validating JSON from %s", functional_layer_json_path) with open(functional_layer_json_path, "r", encoding="utf-8") as f: json_data = json.load(f) try: validate(instance=json_data, schema=schema) except ValidationError as exc: logger.error( "JSON validation failed for %s", functional_layer_json_path, ) raise logger.info("JSON validation succeeded for %s", functional_layer_json_path) logger.debug("Deserializing feature list from %s", functional_layer_json_path) feature_list = deserialize_json(functional_layer_json_path) available_roles = list(feature_list.features.keys()) logger.debug("Available roles: %s", available_roles) if role is not None: logger.debug("Filtering for specific role: %s", role) if role == "": logger.error( "Invalid role input: empty string for %s (available roles: %s)", functional_layer_json_path, available_roles, ) raise ValueError("Role must be a non-empty string") # Case-insensitive role matching role_lower = role.lower() matched_role = None for available_role in available_roles: if available_role.lower() == role_lower: matched_role = available_role break if matched_role is None: logger.error( "Role '%s' not found in %s. Available roles: %s", role, functional_layer_json_path, available_roles, ) raise ValueError( f"Role '{role}' not found. Available roles: {available_roles}" ) roles_to_process = [matched_role] else: logger.debug("Processing all roles") roles_to_process = available_roles result: List[Dict] = [] total_packages = 0 for role_name in roles_to_process: feature = feature_list.features[role_name] packages_list = [] for pkg in feature.packages: pkg_dict = { "name": pkg.package, "type": pkg.type, "repo_name": pkg.repo_name if pkg.repo_name else None, "architecture": pkg.architecture, "uri": pkg.uri, "tag": pkg.tag, } packages_list.append(pkg_dict) role_obj = { "roleName": role_name, "packages": packages_list, } result.append(role_obj) total_packages += len(packages_list) logger.debug( "Processed role '%s': %d packages", role_name, len(packages_list), ) logger.info( "get_package_list completed for %s: %d role(s), %d total package(s)", functional_layer_json_path, len(result), total_packages, ) return result def generate_root_json_from_catalog( catalog_path: str, schema_path: str = _DEFAULT_SCHEMA_PATH, output_root: str = "out/generator", *, log_file: Optional[str] = None, configure_logging: bool = False, log_level: int = logging.INFO, ) -> None: """Generate per-arch/OS/version FeatureList JSONs for a catalog file. - If configure_logging is True, logging is configured using _configure_logging, optionally writing to log_file. 
- On missing files, FileNotFoundError is raised after logging an error. - No sys.exit is called; callers are expected to handle exceptions. """ # Optional logging configuration for library callers if configure_logging: _configure_logging(log_file=log_file, log_level=log_level) # Shared input validation _validate_catalog_and_schema_paths(catalog_path, schema_path) catalog = ParseCatalog(catalog_path, schema_path) functional_layer_json = generate_functional_layer_json(catalog) infrastructure_json = generate_infrastructure_json(catalog) drivers_json = generate_drivers_json(catalog) base_os_json = generate_base_os_json(catalog) miscellaneous_json = generate_miscellaneous_json(catalog) combos = _discover_arch_os_version_from_catalog(catalog) logger.info( "Discovered %d combination(s) for feature-list generation", len(combos) ) for arch, os_name, version in combos: base_dir = os.path.join(output_root, arch, os_name, version) os.makedirs(base_dir, exist_ok=True) logger.info( "Generating feature-list JSONs for arch=%s os=%s version=%s into %s", arch, os_name, version, base_dir, ) func_arch = _filter_featurelist_for_arch(functional_layer_json, arch) infra_arch = _filter_featurelist_for_arch(infrastructure_json, arch) drivers_arch = _filter_featurelist_for_arch(drivers_json, arch) base_os_arch = _filter_featurelist_for_arch(base_os_json, arch) misc_arch = _filter_featurelist_for_arch(miscellaneous_json, arch) serialize_json(func_arch, os.path.join(base_dir, 'functional_layer.json')) serialize_json(infra_arch, os.path.join(base_dir, 'infrastructure.json')) serialize_json(drivers_arch, os.path.join(base_dir, 'drivers.json')) serialize_json(base_os_arch, os.path.join(base_dir, 'base_os.json')) serialize_json(misc_arch, os.path.join(base_dir, 'miscellaneous.json')) if __name__ == "__main__": # Example usage: generate per-arch/OS/version FeatureList JSONs under # out//// parser = argparse.ArgumentParser(description="Catalog Parser CLI") parser.add_argument( "--catalog", required=True, help="Path to input catalog JSON file", ) parser.add_argument( "--schema", required=False, default=_DEFAULT_SCHEMA_PATH, help="Path to catalog schema JSON file", ) parser.add_argument( "--log-file", required=False, default=None, help="Path to log file; if not set, logs go to stderr", ) args = parser.parse_args() # Configure logging once for the CLI _configure_logging(log_file=args.log_file, log_level=logging.INFO) logger.info("Catalog Parser CLI started for %s", args.catalog) try: # Reuse the programmatic API to generate all FeatureList JSONs. generate_root_json_from_catalog( catalog_path=args.catalog, schema_path=args.schema, output_root=os.path.join("out", "main"), ) logger.info("Catalog Parser CLI completed for %s", args.catalog) except FileNotFoundError: logger.error("File not found during processing") sys.exit(ERROR_CODE_INPUT_NOT_FOUND) except ValidationError: sys.exit(ERROR_CODE_PROCESSING_ERROR) except Exception: logger.exception("Unexpected error while generating feature-list JSONs") sys.exit(ERROR_CODE_PROCESSING_ERROR) ================================================ FILE: build_stream/core/catalog/models.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. 
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

"""Catalog parser models.

Contains the dataclass-based in-memory representations of catalog components.
"""

from dataclasses import dataclass
from typing import List, Optional


@dataclass
class Package:
    """Generic package entry from the catalog.

    Represents a single software package with name, version, supported OS
    list, architecture list, and optional source metadata.
    """

    id: str
    name: str
    version: str
    supported_os: List[str]
    uri: str
    architecture: List[str]
    type: str
    tag: str = ""
    sources: Optional[List[dict]] = None


@dataclass
class FunctionalPackage(Package):
    """Package that belongs to the functional layer of the catalog."""


@dataclass
class OsPackage(Package):
    """Package that belongs to the base OS layer of the catalog."""


@dataclass
class InfrastructurePackage:
    """Infrastructure package as described in the catalog."""

    def __init__(self, id, name, version, uri, architecture, config, type, sources=None, tag=""):
        self.id = id
        self.name = name
        self.version = version
        self.uri = uri
        self.architecture = architecture
        self.config = config
        self.type = type
        self.sources = sources
        self.tag = tag


@dataclass
class Driver:
    """Driver package entry used by the drivers layer of the catalog."""

    def __init__(self, id, name, version, uri, architecture, config, type):
        self.id = id
        self.name = name
        self.version = version
        self.uri = uri
        self.architecture = architecture
        self.config = config
        self.type = type


@dataclass
class Catalog:
    """Top-level in-memory representation of the catalog JSON.

    Holds raw layer sections and the resolved package objects used by
    generator and adapter components.
    """

    name: str
    version: str
    functional_layer: List[dict]
    base_os: List[dict]
    infrastructure: List[dict]
    drivers_layer: List[dict]
    drivers: List[Driver]
    functional_packages: List[FunctionalPackage]
    os_packages: List[OsPackage]
    infrastructure_packages: List[InfrastructurePackage]
    miscellaneous: List[str]


================================================
FILE: build_stream/core/catalog/parser.py
================================================
# Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

"""Catalog parser.

Loads and validates a catalog JSON file against CatalogSchema.json and
materializes it into model objects.
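
Typical use (illustrative path; the catalog file name is a placeholder):

    catalog = ParseCatalog("catalog.json")
    print(catalog.name, catalog.version, len(catalog.functional_packages))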
""" import json import logging import os from jsonschema import validate, ValidationError from .models import Catalog, FunctionalPackage, OsPackage, InfrastructurePackage, Driver from .utils import load_json_file logger = logging.getLogger(__name__) _BASE_DIR = os.path.dirname(__file__) _DEFAULT_SCHEMA_PATH = os.path.join(_BASE_DIR, "resources", "CatalogSchema.json") def ParseCatalog(file_path: str, schema_path: str = _DEFAULT_SCHEMA_PATH) -> Catalog: """Parse a catalog JSON file and validate it against the JSON schema. Args: file_path: Path to the catalog JSON file. schema_path: Path to the JSON schema used for validation. Returns: A populated Catalog instance built from the validated JSON data. """ logger.info("Parsing catalog from %s using schema %s", file_path, schema_path) schema = load_json_file(schema_path) catalog_json = load_json_file(file_path) logger.debug("Validating catalog JSON against schema") try: validate(instance=catalog_json, schema=schema) except ValidationError: logger.error( "Catalog validation failed for %s", file_path, ) raise data = catalog_json["Catalog"] functional_packages = [ FunctionalPackage( id=key, name=pkg["Name"], version=pkg.get("Version", ""), supported_os=[f"{os['Name']} {os['Version']}" for os in pkg["SupportedOS"]], uri="", type=pkg["Type"], architecture=pkg["Architecture"], tag=pkg.get("Tag", ""), sources=pkg.get("Sources", []), ) for key, pkg in data["FunctionalPackages"].items() ] os_packages = [ OsPackage( id=key, name=pkg["Name"], version=pkg.get("Version", ""), supported_os=[f"{os['Name']} {os['Version']}" for os in pkg["SupportedOS"]], uri="", architecture=pkg["Architecture"], sources=pkg.get("Sources", []), type=pkg["Type"], tag=pkg.get("Tag", ""), ) for key, pkg in data["OSPackages"].items() ] infrastructure_packages = [ InfrastructurePackage( id=key, name=pkg["Name"], version=pkg["Version"], uri=pkg.get("Uri", ""), architecture=pkg.get("Architecture", []), config=pkg["SupportedFunctions"], type=pkg["Type"], sources=pkg.get("Sources", []), tag=pkg.get("Tag", ""), ) for key, pkg in data["InfrastructurePackages"].items() ] driver_packages = data.get("DriverPackages", {}) drivers = [ Driver( id=key, name=drv["Name"], version=drv["Version"], uri=drv["Uri"], architecture=drv["Architecture"], config=drv["Config"], type=drv["Type"], ) for key, drv in driver_packages.items() ] catalog = Catalog( name=data["Name"], version=data["Version"], functional_layer=data["FunctionalLayer"], base_os=data["BaseOS"], infrastructure=data["Infrastructure"], drivers_layer=data.get("Drivers", []), drivers=drivers, functional_packages=functional_packages, os_packages=os_packages, infrastructure_packages=infrastructure_packages, miscellaneous=data.get("Miscellaneous", []), ) logger.info( "Parsed catalog %s v%s: %d functional, %d OS, %d infrastructure, %d drivers", catalog.name, catalog.version, len(functional_packages), len(os_packages), len(infrastructure_packages), len(drivers), ) return catalog ================================================ FILE: build_stream/core/catalog/resources/AdapterPolicySchema.json ================================================ { "$schema": "http://json-schema.org/draft-07/schema#", "$id": "AdapterPolicySchema.json", "title": "Target-Centric Mapping Schema", "description": "Schema defining how to build target config JSON files from one or more source JSON files, including derived roles.", "type": "object", "properties": { "version": { "type": "string", "description": "Schema version for future compatibility" }, "description": { "type": 
"string", "description": "Human-readable description of this mapping configuration" }, "architectures": { "type": "array", "description": "List of supported architectures", "items": { "type": "string" }, "minItems": 1, "uniqueItems": true }, "targets": { "type": "object", "description": "Target files to generate (filename -> target spec)", "additionalProperties": { "$ref": "#/definitions/targetSpec" } } }, "required": ["version", "targets"], "definitions": { "targetSpec": { "type": "object", "description": "Specification for building a single target file", "properties": { "sources": { "type": "array", "description": "Source files and roles to pull into this target", "items": { "$ref": "#/definitions/sourceSpec" } }, "derived": { "type": "array", "description": "Derived roles computed from pulled roles", "items": { "$ref": "#/definitions/derivedSpec" } }, "transform": { "$ref": "#/definitions/transform", "description": "Transform applied to all packages in this target (unless overridden per pull)" }, "conditions": { "$ref": "#/definitions/conditions", "description": "Optional conditions for when this target applies" } }, "required": ["sources"] }, "sourceSpec": { "type": "object", "description": "Defines which roles (keys) to pull from a given source file", "properties": { "source_file": { "type": "string", "description": "Input file name (without path, e.g., 'functional_layer.json')" }, "pulls": { "type": "array", "description": "Roles to pull from the source file", "items": { "$ref": "#/definitions/pullSpec" }, "minItems": 1 } }, "required": ["source_file", "pulls"] }, "pullSpec": { "type": "object", "description": "Pull a role from a source file into the target file, optionally renaming and filtering", "properties": { "source_key": { "type": "string", "description": "Role/key in the source file" }, "target_key": { "type": "string", "description": "Role/key to write into the target file; defaults to source_key if omitted" }, "filter": { "$ref": "#/definitions/filter", "description": "Optional filter for this role" }, "transform": { "$ref": "#/definitions/transform", "description": "Optional per-role transform override" } }, "required": ["source_key"] }, "derivedSpec": { "type": "object", "description": "A derived role definition", "properties": { "target_key": { "type": "string", "description": "Role/key to create in the target file" }, "operation": { "$ref": "#/definitions/operation" } }, "required": ["target_key", "operation"] }, "operation": { "type": "object", "description": "Operation to derive a role and remove common packages from source roles", "properties": { "type": { "type": "string", "enum": ["extract_common"], "description": "Currently supported derived operation types" }, "from_keys": { "type": "array", "description": "Target roles to compare", "items": { "type": "string" }, "minItems": 2 }, "min_occurrences": { "type": "integer", "description": "Minimum occurrences across from_keys to be considered common", "default": 2 }, "remove_from_sources": { "type": "boolean", "description": "If true, common packages are removed from each role in from_keys", "default": true } }, "required": ["type", "from_keys"] }, "conditions": { "type": "object", "description": "Conditions that determine when a mapping rule applies", "properties": { "architectures": { "type": "array", "description": "Limit this mapping to specific architectures. 
If omitted, applies to all.", "items": { "type": "string" } }, "os_versions": { "type": "array", "description": "Limit this mapping to specific OS versions (e.g., ['10.0', '9.0'])", "items": { "type": "string" } }, "os_families": { "type": "array", "description": "Limit this mapping to specific OS families (e.g., ['rhel', 'ubuntu'])", "items": { "type": "string" } } } }, "transform": { "type": "object", "description": "Transformation rules to apply when writing package objects", "properties": { "exclude_fields": { "type": "array", "description": "Fields to exclude from package objects", "items": { "type": "string" } }, "rename_fields": { "type": "object", "description": "Field renaming map (old_name -> new_name)", "additionalProperties": { "type": "string" } } } }, "filter": { "type": "object", "description": "Filter rules to select specific packages from source", "properties": { "type": { "type": "string", "description": "Type of filter to apply", "enum": ["substring", "allowlist", "field_in", "any_of"] }, "field": { "type": "string", "description": "Field to apply filter on (for substring filter)", "default": "package" }, "values": { "type": "array", "description": "Values to match against (for substring filter)", "items": { "type": "string" } }, "case_sensitive": { "type": "boolean", "description": "Whether substring matching is case-sensitive", "default": false }, "filters": { "type": "array", "description": "Sub-filters for composite any_of filter", "items": { "$ref": "#/definitions/filter" }, "minItems": 1 } }, "allOf": [ { "if": {"properties": {"type": {"const": "any_of"}}}, "then": {"required": ["filters"]} } ], "required": ["type"] } } } ================================================ FILE: build_stream/core/catalog/resources/CatalogSchema.json ================================================ { "$schema": "https://json-schema.org/draft-07/schema#", "schemaVersion": "1.0", "title": "Catalog", "type": "object", "properties": { "Catalog": { "type": "object", "properties": { "Name": {"type": "string"}, "Version": {"type": "string"}, "Identifier": {"type": "string"}, "FunctionalLayer": { "type": "array", "items": { "type": "object", "properties": { "Name": {"type": "string"}, "FunctionalPackages": { "type": "array", "items": {"type": "string"} } }, "required": ["Name", "FunctionalPackages"] } }, "BaseOS": { "type": "array", "items": { "type": "object", "properties": { "Name": {"type": "string"}, "Version": {"type": "string"}, "osPackages": { "type": "array", "items": {"type": "string"} } }, "required": ["osPackages"] } }, "Infrastructure": { "type": "array", "items": { "type": "object", "properties": { "Name": {"type": "string"}, "InfrastructurePackages": { "type": "array", "items": {"type": "string"} } }, "required": ["Name", "InfrastructurePackages"] } }, "Miscellaneous": { "type": "array", "items": {"type": "string"} }, "Drivers": { "type": "array", "items": { "type": "object", "properties": { "Name": {"type": "string"}, "DriverPackages": { "type": "array", "items": {"type": "string"} } }, "required": ["Name", "DriverPackages"] } }, "DriverPackages": { "type": "object", "additionalProperties": { "type": "object", "properties": { "Name": {"type": "string"}, "Version": {"type": "string"}, "Uri": {"type": "string"}, "Architecture": { "type": "array", "items": {"type": "string"} }, "Type": {"type": "string"}, "Config": { "type": "object", "properties": { "DriverBrand": {"type": "string"}, "DriverType": {"type": "string"} }, "required": ["DriverBrand", "DriverType"] } }, "required": 
["Name", "Version", "Uri", "Architecture", "Type", "Config"] } }, "FunctionalPackages": { "type": "object", "additionalProperties": { "type": "object", "properties": { "Name": {"type": "string"}, "Version": {"type": "string"}, "Tag": {"type": "string"}, "SupportedOS": { "type": "array", "items": { "type": "object", "properties": { "Name": {"type": "string"}, "Version": {"type": "string"} }, "required": ["Name", "Version"] } }, "Sources": { "type": "array", "items": { "type": "object", "properties": { "Architecture": {"type": "string"}, "RepoName": {"type": "string"}, "Uri": {"type": "string"} }, "required": ["Architecture"], "anyOf": [ {"required": ["RepoName"]}, {"required": ["Uri"]} ] } }, "Architecture": { "type": "array", "items": {"type": "string"} }, "Type": {"type": "string"} }, "required": ["Name", "SupportedOS", "Architecture", "Type"] } }, "OSPackages": { "type": "object", "additionalProperties": { "type": "object", "properties": { "Name": {"type": "string"}, "Version": {"type": "string"}, "Tag": {"type": "string"}, "SupportedOS": { "type": "array", "items": { "type": "object", "properties": { "Name": {"type": "string"}, "Version": {"type": "string"} }, "required": ["Name", "Version"] } }, "Sources": { "type": "array", "items": { "type": "object", "properties": { "Architecture": {"type": "string"}, "RepoName": {"type": "string"}, "Uri": {"type": "string"} }, "required": ["Architecture"], "anyOf": [ {"required": ["RepoName"]}, {"required": ["Uri"]} ] } }, "Architecture": { "type": "array", "items": {"type": "string"} }, "Type": {"type": "string"} }, "required": ["Name", "SupportedOS", "Architecture", "Type"] } }, "InfrastructurePackages": { "type": "object", "additionalProperties": { "type": "object", "properties": { "Name": {"type": "string"}, "Version": {"type": ["string", "null"]}, "Tag": {"type": "string"}, "Type": {"type": "string"}, "Architecture": { "type": "array", "items": {"type": "string"} }, "SupportedFunctions": { "type": "array", "items": { "type": "object", "properties": { "Name": {"type": "string"} }, "required": ["Name"] } } }, "required": ["Name", "Type", "SupportedFunctions"] } } }, "required": [ "Name", "Version", "Identifier", "FunctionalLayer", "BaseOS", "Infrastructure", "Drivers", "DriverPackages", "FunctionalPackages", "OSPackages", "InfrastructurePackages" ] } }, "required": ["Catalog"] } ================================================ FILE: build_stream/core/catalog/resources/RootLevelSchema.json ================================================ { "$schema": "http://json-schema.org/draft-07/schema#", "title": "Root Feature List", "type": "object", "description": "Schema for root jsons produced by catalog_parser. Top-level keys are role names; each role contains a packages array.", "additionalProperties": { "type": "object", "required": [ "packages" ], "properties": { "packages": { "type": "array", "items": { "type": "object", "required": [ "package", "type", "architecture" ], "properties": { "package": { "type": "string" }, "type": { "type": "string", "description": "Package source type (e.g., rpm, pip_module, image, tarball, git)." 
}, "repo_name": { "type": "string" }, "architecture": { "type": "array", "items": { "type": "string" }, "minItems": 1 }, "uri": { "type": "string" }, "tag": { "type": "string" }, "sources": { "type": "array", "items": { "type": "object", "properties": { "Architecture": { "type": "string" }, "RepoName": { "type": "string" }, "Uri": { "type": "string" } }, "additionalProperties": true } } }, "additionalProperties": true } } }, "additionalProperties": true } } ================================================ FILE: build_stream/core/catalog/resources/adapter_policy_default.json ================================================ { "version": "2.0.0", "description": "Target-centric mapping spec: pull roles into each target file, then derive common roles and remove duplicates.", "architectures": ["aarch64", "x86_64"], "targets": { "default_packages.json": { "transform": { "exclude_fields": ["architecture"], "rename_fields": {"uri": "url"} }, "sources": [ { "source_file": "base_os.json", "pulls": [ { "source_key": "Base OS", "target_key": "default_packages", "filter": { "type": "allowlist", "field": "package", "values": ["systemd", "systemd-udev", "kernel", "dracut", "dracut-live", "dracut-network", "squashfs-tools", "nfs-utils", "nfs4-acl-tools", "NetworkManager", "nm-connection-editor", "iproute", "iputils", "curl", "bash", "coreutils", "grep", "sed", "gawk", "findutils", "util-linux", "kbd", "lsof", "cryptsetup", "lvm2", "device-mapper", "rsyslog", "chrony", "sudo", "gzip", "wget", "cloud-init", "glibc-langpack-en", "gedit", "docker.io/dellhpcomniaaisolution/image-build-aarch64", "docker.io/dellhpcomniaaisolution/image-build-el10"], "case_sensitive": false } } ] } ] }, "admin_debug_packages.json": { "transform": { "exclude_fields": ["architecture"], "rename_fields": {"uri": "url"} }, "sources": [ { "source_file": "base_os.json", "pulls": [ { "source_key": "Base OS", "target_key": "admin_debug_packages", "filter": { "type": "allowlist", "field": "package", "values": ["which", "tcpdump", "traceroute", "iperf3", "fping", "dmidecode", "hwloc", "hwloc-libs", "lshw", "pciutils", "vim-enhanced", "emacs", "zsh", "openssh", "openssh-server", "openssh-clients", "rsync", "file", "libcurl", "tar", "bzip2", "man-db", "man-pages", "strace", "kexec-tools", "openssl-devel", "ipmitool", "gdb", "gdb-gdbserver", "lldb", "lldb-devel", "valgrind", "valgrind-devel", "ltrace", "kernel-tools", "perf", "papi", "papi-devel", "papi-libs", "cmake", "make", "autoconf", "automake", "libtool", "gcc", "gcc-c++", "gcc-gfortran", "binutils", "binutils-devel", "clustershell", "bash-completion"], "case_sensitive": false } } ] } ] }, "openldap.json": { "transform": { "exclude_fields": ["architecture"], "rename_fields": {"uri": "url"} }, "sources": [ { "source_file": "base_os.json", "pulls": [ { "source_key": "Base OS", "target_key": "openldap", "filter": { "type": "allowlist", "field": "package", "values": ["openldap-clients", "nss-pam-ldapd", "sssd", "oddjob-mkhomedir", "authselect"], "case_sensitive": false } } ] } ] }, "ldms.json": { "transform": { "exclude_fields": ["architecture"], "rename_fields": {"uri": "url"} }, "sources": [ { "source_file": "base_os.json", "pulls": [ { "source_key": "Base OS", "target_key": "ldms", "filter": { "type": "allowlist", "field": "package", "values": ["python3-devel", "python3-cython", "openssl-libs", "ovis-ldms"], "case_sensitive": false } } ] } ] }, "ucx.json": { "transform": { "exclude_fields": ["architecture"], "rename_fields": {"uri": "url"} }, "sources": [ { "source_file": "base_os.json", 
"pulls": [ { "source_key": "Base OS", "target_key": "ucx", "filter": { "type": "allowlist", "field": "package", "values": ["ucx", "gcc-c++", "make"], "case_sensitive": false } } ] } ] }, "openmpi.json": { "transform": { "exclude_fields": ["architecture"], "rename_fields": {"uri": "url"} }, "sources": [ { "source_file": "base_os.json", "pulls": [ { "source_key": "Base OS", "target_key": "openmpi", "filter": { "type": "allowlist", "field": "package", "values": ["openmpi", "pmix-devel", "munge-devel","gcc-c++", "make"], "case_sensitive": false } } ] } ] }, "service_k8s.json": { "conditions": { "architectures": ["x86_64"] }, "transform": { "exclude_fields": ["architecture"], "rename_fields": {"uri": "url"} }, "sources": [ { "source_file": "functional_layer.json", "pulls": [ {"source_key": "service_kube_control_plane_x86_64", "target_key": "service_kube_control_plane"}, {"source_key": "service_kube_control_plane_x86_64", "target_key": "service_kube_control_plane_first"}, {"source_key": "service_kube_node_x86_64", "target_key": "service_kube_node"} ] } ], "derived": [ { "target_key": "service_k8s", "operation": { "type": "extract_common", "from_keys": ["service_kube_control_plane_first", "service_kube_control_plane", "service_kube_node"], "min_occurrences": 3, "remove_from_sources": true } } ] }, "slurm_custom.json": { "transform": { "exclude_fields": ["architecture"], "rename_fields": {"uri": "url"} }, "sources": [ { "source_file": "functional_layer.json", "pulls": [ {"source_key": "slurm_control_node_x86_64", "target_key": "slurm_control_node"}, {"source_key": "slurm_node_x86_64", "target_key": "slurm_node"}, {"source_key": "slurm_node_aarch64", "target_key": "slurm_node"}, {"source_key": "login_node_x86_64", "target_key": "login_node"}, {"source_key": "login_node_aarch64", "target_key": "login_node"}, {"source_key": "login_compiler_node_x86_64", "target_key": "login_compiler_node"}, {"source_key": "login_compiler_node_aarch64", "target_key": "login_compiler_node"} ] } ], "derived": [ { "target_key": "slurm_custom", "operation": { "type": "extract_common", "from_keys": ["login_node", "login_compiler_node", "slurm_control_node", "slurm_node"], "min_occurrences": 4, "remove_from_sources": true } } ] }, "additional_packages.json": { "transform": { "exclude_fields": ["architecture"], "rename_fields": {"uri": "url"} }, "sources": [ { "source_file": "miscellaneous.json", "pulls": [ {"source_key": "slurm_control_node_x86_64", "target_key": "slurm_control_node"}, {"source_key": "slurm_node_x86_64", "target_key": "slurm_node"}, {"source_key": "slurm_node_aarch64", "target_key": "slurm_node"}, {"source_key": "login_node_x86_64", "target_key": "login_node"}, {"source_key": "login_node_aarch64", "target_key": "login_node"}, {"source_key": "login_compiler_node_x86_64", "target_key": "login_compiler_node"}, {"source_key": "login_compiler_node_aarch64", "target_key": "login_compiler_node"}, {"source_key": "service_kube_control_plane_x86_64", "target_key": "service_kube_control_plane"}, {"source_key": "service_kube_control_plane_x86_64", "target_key": "service_kube_control_plane_first"}, {"source_key": "service_kube_node_x86_64", "target_key": "service_kube_node"} ] } ] }, "csi_driver_powerscale.json": { "conditions": { "architectures": ["x86_64"] }, "transform": { "exclude_fields": ["architecture"], "rename_fields": {"uri": "url"} }, "sources": [ { "source_file": "infrastructure.json", "pulls": [ { "source_key": "csi", "target_key": "csi_driver_powerscale", "filter": { "type": "allowlist", "field": 
"package", "values": ["csi-powerscale", "external-snapshotter", "helm-charts", "quay.io/dell/container-storage-modules/csi-isilon", "registry.k8s.io/sig-storage/csi-attacher", "registry.k8s.io/sig-storage/csi-provisioner", "registry.k8s.io/sig-storage/csi-snapshotter", "registry.k8s.io/sig-storage/csi-resizer", "registry.k8s.io/sig-storage/csi-node-driver-registrar", "registry.k8s.io/sig-storage/csi-external-health-monitor-controller", "quay.io/dell/container-storage-modules/dell-csi-replicator", "quay.io/dell/container-storage-modules/podmon", "quay.io/dell/container-storage-modules/csm-authorization-sidecar", "quay.io/dell/container-storage-modules/csi-metadata-retriever", "registry.k8s.io/sig-storage/snapshot-controller", "docker.io/dellemc/csm-encryption"], "case_sensitive": false } } ] } ] } } } ================================================ FILE: build_stream/core/catalog/test_fixtures/adapter_policy_test.json ================================================ { "version": "2.0.0", "description": "Target-centric mapping spec: pull roles into each target file, then derive common roles and remove duplicates.", "architectures": ["aarch64", "x86_64"], "targets": { "default_packages.json": { "transform": { "exclude_fields": ["architecture"] }, "sources": [ { "source_file": "base_os.json", "pulls": [ { "source_key": "Base OS", "target_key": "default_packages", "filter": { "type": "allowlist", "field": "package", "values": ["systemd", "systemd-udev", "kernel", "dracut", "dracut-live", "dracut-network", "squashfs-tools", "nfs-utils", "nfs4-acl-tools", "NetworkManager", "nm-connection-editor", "iproute", "iputils", "curl", "bash", "coreutils", "grep", "sed", "gawk", "findutils", "util-linux", "kbd", "lsof", "cryptsetup", "lvm2", "device-mapper", "rsyslog", "chrony", "sudo", "gzip", "wget", "cloud-init", "glibc-langpack-en", "gedit"], "case_sensitive": false } } ] } ] }, "admin_debug_packages.json": { "transform": { "exclude_fields": ["architecture"] }, "sources": [ { "source_file": "base_os.json", "pulls": [ { "source_key": "Base OS", "target_key": "admin_debug_packages", "filter": { "type": "allowlist", "field": "package", "values": ["which", "tcpdump", "traceroute", "iperf3", "fping", "dmidecode", "hwloc", "hwloc-libs", "lshw", "pciutils", "vim-enhanced", "emacs", "zsh", "openssh", "openssh-server", "openssh-clients", "rsync", "file", "libcurl", "tar", "bzip2", "man-db", "man-pages", "strace", "kexec-tools", "openssl-devel", "ipmitool", "gdb", "gdb-gdbserver", "lldb", "lldb-devel", "valgrind", "valgrind-devel", "ltrace", "kernel-tools", "perf", "papi", "papi-devel", "papi-libs", "cmake", "make", "autoconf", "automake", "libtool", "gcc", "gcc-c++", "gcc-gfortran", "binutils", "binutils-devel", "clustershell", "bash-completion"], "case_sensitive": false } } ] } ] }, "openldap.json": { "transform": { "exclude_fields": ["architecture"] }, "sources": [ { "source_file": "base_os.json", "pulls": [ { "source_key": "Base OS", "target_key": "openldap", "filter": { "type": "allowlist", "field": "package", "values": ["openldap-clients", "nss-pam-ldapd", "sssd", "oddjob-mkhomedir", "authselect"], "case_sensitive": false } } ] } ] }, "ldms.json": { "transform": { "exclude_fields": ["architecture"] }, "sources": [ { "source_file": "base_os.json", "pulls": [ { "source_key": "Base OS", "target_key": "ldms", "filter": { "type": "allowlist", "field": "package", "values": ["python3-devel", "python3-cython", "openssl-libs", "ovis-ldms"], "case_sensitive": false } } ] } ] }, "service_k8s.json": { "transform": { 
"exclude_fields": ["architecture"] }, "sources": [ { "source_file": "functional_layer.json", "pulls": [ {"source_key": "service_kube_control_plane_x86_64", "target_key": "service_kube_control_plane_first"}, {"source_key": "service_kube_control_plane_x86_64", "target_key": "service_kube_control_plane"}, {"source_key": "service_kube_node_x86_64", "target_key": "service_kube_node"} ] } ], "derived": [ { "target_key": "service_k8s", "operation": { "type": "extract_common", "from_keys": ["service_kube_control_plane_first", "service_kube_control_plane", "service_kube_node"], "min_occurrences": 2, "remove_from_sources": true } } ] }, "slurm_custom.json": { "transform": { "exclude_fields": ["architecture"] }, "sources": [ { "source_file": "functional_layer.json", "pulls": [ {"source_key": "login_node_x86_64", "target_key": "login_node"}, {"source_key": "login_node_aarch64", "target_key": "login_node"}, {"source_key": "login_compiler_node_x86_64", "target_key": "login_compiler_node"}, {"source_key": "login_compiler_node_aarch64", "target_key": "login_compiler_node"}, {"source_key": "slurm_control_node_x86_64", "target_key": "slurm_control_node"}, {"source_key": "slurm_node_x86_64", "target_key": "slurm_node"}, {"source_key": "slurm_node_aarch64", "target_key": "slurm_node"} ] } ], "derived": [ { "target_key": "slurm_custom", "operation": { "type": "extract_common", "from_keys": ["login_node", "login_compiler_node", "slurm_control_node", "slurm_node"], "min_occurrences": 2, "remove_from_sources": true } } ] }, "additional_packages.json": { "transform": { "exclude_fields": ["architecture"] }, "sources": [ { "source_file": "functional_layer.json", "pulls": [ {"source_key": "login_node_x86_64", "target_key": "login_node"}, {"source_key": "login_node_aarch64", "target_key": "login_node"}, {"source_key": "login_compiler_node_x86_64", "target_key": "login_compiler_node"}, {"source_key": "login_compiler_node_aarch64", "target_key": "login_compiler_node"}, {"source_key": "slurm_control_node_x86_64", "target_key": "slurm_control_node"}, {"source_key": "slurm_node_x86_64", "target_key": "slurm_node"}, {"source_key": "slurm_node_aarch64", "target_key": "slurm_node"}, {"source_key": "service_kube_control_plane_x86_64", "target_key": "service_kube_control_plane_first"}, {"source_key": "service_kube_control_plane_x86_64", "target_key": "service_kube_control_plane"}, {"source_key": "service_kube_node_x86_64", "target_key": "service_kube_node"} ] } ] }, "csi_driver_powerscale.json": { "transform": { "exclude_fields": ["architecture"] }, "sources": [ { "source_file": "base_os.json", "pulls": [ { "source_key": "Base OS", "target_key": "csi_driver_powerscale", "filter": { "type": "allowlist", "field": "package", "values": ["csi-powerscale", "external-snapshotter", "helm-charts", "quay.io/dell/container-storage-modules/csi-isilon", "registry.k8s.io/sig-storage/csi-attacher", "registry.k8s.io/sig-storage/csi-provisioner", "registry.k8s.io/sig-storage/csi-snapshotter", "registry.k8s.io/sig-storage/csi-resizer", "registry.k8s.io/sig-storage/csi-node-driver-registrar", "registry.k8s.io/sig-storage/csi-external-health-monitor-controller", "quay.io/dell/container-storage-modules/dell-csi-replicator", "quay.io/dell/container-storage-modules/podmon", "quay.io/dell/container-storage-modules/csm-authorization-sidecar", "quay.io/dell/container-storage-modules/csi-metadata-retriever", "registry.k8s.io/sig-storage/snapshot-controller", "docker.io/dellemc/csm-encryption"], "case_sensitive": false } } ] } ] } } } 
================================================ FILE: build_stream/core/catalog/test_fixtures/catalog_rhel.json ================================================ { "Catalog": { "Name": "Catalog", "Version": "1.0", "Identifier": "image-build", "FunctionalLayer": [ { "Name": "login_compiler_node_aarch64", "FunctionalPackages": [ "package_id_13", "package_id_19", "package_id_2", "package_id_3", "package_id_4", "package_id_5", "package_id_6", "package_id_7", "package_id_8" ] }, { "Name": "login_node_x86_64", "FunctionalPackages": [ "package_id_13", "package_id_19", "package_id_2", "package_id_3", "package_id_4", "package_id_5", "package_id_6", "package_id_7", "package_id_8" ] }, { "Name": "service_kube_control_plane_x86_64", "FunctionalPackages": [ "package_id_1", "package_id_20", "package_id_21", "package_id_22", "package_id_23", "package_id_24", "package_id_25", "package_id_26", "package_id_27", "package_id_28", "package_id_29", "package_id_3", "package_id_30", "package_id_31", "package_id_32", "package_id_33", "package_id_34", "package_id_35", "package_id_36", "package_id_37", "package_id_38", "package_id_39", "package_id_4", "package_id_40", "package_id_41", "package_id_42", "package_id_43", "package_id_44", "package_id_45", "package_id_46", "package_id_47", "package_id_48", "package_id_49", "package_id_50", "package_id_51", "package_id_52", "package_id_53", "package_id_54", "package_id_55", "package_id_56", "package_id_57", "package_id_58", "package_id_59", "package_id_60", "package_id_61", "package_id_62", "package_id_63", "package_id_64", "package_id_65", "package_id_66", "package_id_67", "package_id_68", "package_id_7", "package_id_8" ] }, { "Name": "service_kube_node_x86_64", "FunctionalPackages": [ "package_id_1", "package_id_20", "package_id_21", "package_id_22", "package_id_23", "package_id_24", "package_id_25", "package_id_26", "package_id_27", "package_id_28", "package_id_29", "package_id_3", "package_id_30", "package_id_31", "package_id_32", "package_id_33", "package_id_34", "package_id_35", "package_id_36", "package_id_37", "package_id_38", "package_id_39", "package_id_4", "package_id_40", "package_id_41", "package_id_42", "package_id_43", "package_id_44", "package_id_45", "package_id_46", "package_id_47", "package_id_59", "package_id_69", "package_id_7", "package_id_70", "package_id_8" ] }, { "Name": "slurm_control_node_x86_64", "FunctionalPackages": [ "package_id_10", "package_id_11", "package_id_12", "package_id_2", "package_id_3", "package_id_4", "package_id_5", "package_id_6", "package_id_7", "package_id_71", "package_id_72", "package_id_73", "package_id_74", "package_id_8", "package_id_9" ] }, { "Name": "slurm_node_aarch64", "FunctionalPackages": [ "package_id_13", "package_id_14", "package_id_15", "package_id_16", "package_id_17", "package_id_18", "package_id_2", "package_id_3", "package_id_4", "package_id_5", "package_id_6", "package_id_7", "package_id_8" ] } ], "BaseOS": [ { "Name": "RHEL", "Version": "10.0", "osPackages": [ "os_package_id_1", "os_package_id_10", "os_package_id_11", "os_package_id_12", "os_package_id_13", "os_package_id_14", "os_package_id_15", "os_package_id_16", "os_package_id_17", "os_package_id_18", "os_package_id_19", "os_package_id_2", "os_package_id_20", "os_package_id_21", "os_package_id_22", "os_package_id_23", "os_package_id_24", "os_package_id_25", "os_package_id_26", "os_package_id_27", "os_package_id_28", "os_package_id_29", "os_package_id_3", "os_package_id_30", "os_package_id_31", "os_package_id_32", "os_package_id_33", 
"os_package_id_34", "os_package_id_35", "os_package_id_36", "os_package_id_37", "os_package_id_38", "os_package_id_39", "os_package_id_4", "os_package_id_40", "os_package_id_41", "os_package_id_42", "os_package_id_43", "os_package_id_44", "os_package_id_45", "os_package_id_46", "os_package_id_47", "os_package_id_48", "os_package_id_49", "os_package_id_5", "os_package_id_50", "os_package_id_51", "os_package_id_52", "os_package_id_53", "os_package_id_54", "os_package_id_55", "os_package_id_56", "os_package_id_57", "os_package_id_58", "os_package_id_59", "os_package_id_6", "os_package_id_60", "os_package_id_61", "os_package_id_62", "os_package_id_63", "os_package_id_64", "os_package_id_65", "os_package_id_66", "os_package_id_67", "os_package_id_68", "os_package_id_69", "os_package_id_7", "os_package_id_70", "os_package_id_71", "os_package_id_72", "os_package_id_73", "os_package_id_74", "os_package_id_75", "os_package_id_76", "os_package_id_77", "os_package_id_78", "os_package_id_79", "os_package_id_8", "os_package_id_80", "os_package_id_81", "os_package_id_82", "os_package_id_83", "os_package_id_84", "os_package_id_85", "os_package_id_86", "os_package_id_87", "os_package_id_88", "os_package_id_89", "os_package_id_9", "os_package_id_90", "os_package_id_91", "os_package_id_92", "os_package_id_93", "os_package_id_94", "os_package_id_95" ] } ], "Infrastructure": [], "Drivers": [], "DriverPackages": {}, "FunctionalPackages": { "package_id_1": { "Name": "vim-enhanced", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_appstream" }, { "Architecture": "x86_64", "RepoName": "x86_64_appstream" } ] }, "package_id_2": { "Name": "munge", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_appstream" }, { "Architecture": "x86_64", "RepoName": "x86_64_appstream" } ] }, "package_id_3": { "Name": "firewalld", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "package_id_4": { "Name": "python3-firewall", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "package_id_5": { "Name": "pmix", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_appstream" }, { "Architecture": "x86_64", "RepoName": "x86_64_appstream" } ] }, "package_id_6": { "Name": "nvcr.io/nvidia/hpc-benchmarks", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "image", "Tag": "25.09", "Version": "25.09" }, "package_id_7": { "Name": "apptainer", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "epel" }, { "Architecture": "x86_64", "RepoName": "epel" } ] }, "package_id_8": { "Name": "doca-ofed", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm_repo", 
"Sources": [ { "Architecture": "aarch64", "RepoName": "doca" }, { "Architecture": "x86_64", "RepoName": "doca" } ] }, "package_id_9": { "Name": "slurm-slurmctld", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_slurm_custom" }, { "Architecture": "x86_64", "RepoName": "x86_64_slurm_custom" } ] }, "package_id_10": { "Name": "slurm-slurmdbd", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_slurm_custom" }, { "Architecture": "x86_64", "RepoName": "x86_64_slurm_custom" } ] }, "package_id_11": { "Name": "python3-PyMySQL", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_appstream" }, { "Architecture": "x86_64", "RepoName": "x86_64_appstream" } ] }, "package_id_12": { "Name": "mariadb-server", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_appstream" }, { "Architecture": "x86_64", "RepoName": "x86_64_appstream" } ] }, "package_id_13": { "Name": "slurm-slurmd", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_slurm_custom" }, { "Architecture": "x86_64", "RepoName": "x86_64_slurm_custom" } ] }, "package_id_14": { "Name": "slurm-pam_slurm", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_slurm_custom" }, { "Architecture": "x86_64", "RepoName": "x86_64_slurm_custom" } ] }, "package_id_15": { "Name": "kernel-devel", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_appstream" }, { "Architecture": "x86_64", "RepoName": "x86_64_appstream" } ] }, "package_id_16": { "Name": "kernel-headers", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_appstream" }, { "Architecture": "x86_64", "RepoName": "x86_64_appstream" } ] }, "package_id_17": { "Name": "cuda-run", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "iso", "Sources": [ { "Architecture": "aarch64", "Uri": "https://developer.download.nvidia.com/compute/cuda/13.0.2/local_installers/cuda_13.0.2_580.95.05_linux_sbsa.run" }, { "Architecture": "x86_64", "Uri": "https://developer.download.nvidia.com/compute/cuda/13.0.2/local_installers/cuda_13.0.2_580.95.05_linux.run" } ] }, "package_id_18": { "Name": "nvhpc_2025_2511_Linux_aarch64_cuda_13.0", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64" ], "Type": "tarball", "Sources": [ { "Architecture": "aarch64", "Uri": "https://developer.download.nvidia.com/hpc-sdk/25.11/nvhpc_2025_2511_Linux_aarch64_cuda_13.0.tar.gz" } ] }, "package_id_19": { "Name": "slurm", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", 
"RepoName": "aarch64_slurm_custom" }, { "Architecture": "x86_64", "RepoName": "x86_64_slurm_custom" } ] }, "package_id_20": { "Name": "docker.io/library/busybox", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "image", "Tag": "1.36", "Version": "1.36" }, "package_id_21": { "Name": "git", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "x86_64", "RepoName": "x86_64_appstream" } ] }, "package_id_22": { "Name": "fuse-overlayfs", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "x86_64", "RepoName": "x86_64_appstream" } ] }, "package_id_23": { "Name": "podman", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "x86_64", "RepoName": "x86_64_appstream" } ] }, "package_id_24": { "Name": "kubeadm-1.34.1", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "x86_64", "RepoName": "kubernetes" } ] }, "package_id_25": { "Name": "kubelet-1.34.1", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "x86_64", "RepoName": "kubernetes" } ] }, "package_id_26": { "Name": "container-selinux", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "x86_64", "RepoName": "x86_64_appstream" } ] }, "package_id_27": { "Name": "cri-o-1.34.1", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "x86_64", "RepoName": "cri-o" } ] }, "package_id_28": { "Name": "docker.io/victoriametrics/victoria-metrics", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "image", "Tag": "v1.128.0", "Version": "v1.128.0" }, "package_id_29": { "Name": "docker.io/victoriametrics/vmagent", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "image", "Tag": "v1.128.0", "Version": "v1.128.0" }, "package_id_30": { "Name": "docker.io/victoriametrics/vmstorage", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "image", "Tag": "v1.128.0-cluster", "Version": "v1.128.0-cluster" }, "package_id_31": { "Name": "docker.io/victoriametrics/vminsert", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "image", "Tag": "v1.128.0-cluster", "Version": "v1.128.0-cluster" }, "package_id_32": { "Name": "docker.io/victoriametrics/vmselect", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "image", "Tag": "v1.128.0-cluster", "Version": "v1.128.0-cluster" }, "package_id_33": { "Name": "docker.io/alpine/kubectl", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "image", "Tag": "1.34.1", "Version": "1.34.1" }, "package_id_34": { "Name": "docker.io/curlimages/curl", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "image", "Tag": "8.17.0", "Version": "8.17.0" }, "package_id_35": { "Name": "docker.io/rmohr/activemq", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "image", "Tag": 
"5.15.9", "Version": "5.15.9" }, "package_id_36": { "Name": "docker.io/library/mysql", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "image", "Tag": "9.3.0", "Version": "9.3.0" }, "package_id_37": { "Name": "docker.io/dellhpcomniaaisolution/idrac_telemetry_receiver", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "image", "Tag": "1.2", "Version": "1.2" }, "package_id_38": { "Name": "docker.io/dellhpcomniaaisolution/kafkapump", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "image", "Tag": "1.2", "Version": "1.2" }, "package_id_39": { "Name": "docker.io/dellhpcomniaaisolution/victoriapump", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "image", "Tag": "1.2", "Version": "1.2" }, "package_id_40": { "Name": "cryptography==45.0.7", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "pip_module" }, "package_id_41": { "Name": "omsdk==1.2.518", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "pip_module" }, "package_id_42": { "Name": "cffi==1.17.1", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "pip_module" }, "package_id_43": { "Name": "quay.io/strimzi/operator", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "image", "Tag": "0.48.0", "Version": "0.48.0" }, "package_id_44": { "Name": "quay.io/strimzi/kafka", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "image", "Tag": "0.48.0-kafka-4.1.0", "Version": "0.48.0-kafka-4.1.0" }, "package_id_45": { "Name": "docker.io/dellhpcomniaaisolution/ubuntu-ldms", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "image", "Tag": "1.0", "Version": "1.0" }, "package_id_46": { "Name": "strimzi-kafka-operator-helm-3-chart-0.48.0", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "tarball", "Sources": [ { "Architecture": "x86_64", "Uri": "https://github.com/strimzi/strimzi-kafka-operator/releases/download/0.48.0/strimzi-kafka-operator-helm-3-chart-0.48.0.tgz" } ] }, "package_id_47": { "Name": "quay.io/strimzi/kafka-bridge", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "image", "Tag": "0.33.1", "Version": "0.33.1" }, "package_id_48": { "Name": "ghcr.io/kube-vip/kube-vip", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "image", "Tag": "v0.8.9", "Version": "v0.8.9" }, "package_id_49": { "Name": "registry.k8s.io/kube-apiserver", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "image", "Tag": "v1.34.1", "Version": "v1.34.1" }, "package_id_50": { "Name": "registry.k8s.io/kube-controller-manager", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "image", "Tag": "v1.34.1", "Version": "v1.34.1" }, "package_id_51": { "Name": "registry.k8s.io/kube-scheduler", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "image", "Tag": "v1.34.1", "Version": "v1.34.1" }, "package_id_52": { "Name": "registry.k8s.io/kube-proxy", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "image", 
"Tag": "v1.34.1", "Version": "v1.34.1" }, "package_id_53": { "Name": "registry.k8s.io/coredns/coredns", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "image", "Tag": "v1.12.1", "Version": "v1.12.1" }, "package_id_54": { "Name": "registry.k8s.io/pause", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "image", "Tag": "3.10.1", "Version": "3.10.1" }, "package_id_55": { "Name": "registry.k8s.io/etcd", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "image", "Tag": "3.6.4-0", "Version": "3.6.4-0" }, "package_id_56": { "Name": "docker.io/calico/cni", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "image", "Tag": "v3.30.3", "Version": "v3.30.3" }, "package_id_57": { "Name": "docker.io/calico/kube-controllers", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "image", "Tag": "v3.30.3", "Version": "v3.30.3" }, "package_id_58": { "Name": "docker.io/calico/node", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "image", "Tag": "v3.30.3", "Version": "v3.30.3" }, "package_id_59": { "Name": "quay.io/metallb/speaker", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "image", "Tag": "v0.15.2", "Version": "v0.15.2" }, "package_id_60": { "Name": "kubectl-1.34.1", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "x86_64", "RepoName": "kubernetes" } ] }, "package_id_61": { "Name": "prettytable==3.14.0", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "pip_module" }, "package_id_62": { "Name": "python3-3.12.9", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "package_id_63": { "Name": "kubernetes==33.1.0", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "pip_module" }, "package_id_64": { "Name": "PyMySQL==1.1.2", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "pip_module" }, "package_id_65": { "Name": "calico-v3.30.3", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "manifest", "Sources": [ { "Architecture": "x86_64", "Uri": "https://raw.githubusercontent.com/projectcalico/calico/v3.30.3/manifests/calico.yaml" } ] }, "package_id_66": { "Name": "metallb-native-v0.15.2", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "manifest", "Sources": [ { "Architecture": "x86_64", "Uri": "https://raw.githubusercontent.com/metallb/metallb/v0.15.2/config/manifests/metallb-native.yaml" } ] }, "package_id_67": { "Name": "helm-v3.19.0-amd64", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "tarball", "Sources": [ { "Architecture": "x86_64", "Uri": "https://get.helm.sh/helm-v3.19.0-linux-amd64.tar.gz" } ] }, "package_id_68": { "Name": "nfs-subdir-external-provisioner-4.0.18", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "tarball", "Sources": [ { "Architecture": "x86_64", "Uri": 
"https://github.com/kubernetes-sigs/nfs-subdir-external-provisioner/releases/download/nfs-subdir-external-provisioner-4.0.18/nfs-subdir-external-provisioner-4.0.18.tgz" } ] }, "package_id_69": { "Name": "registry.k8s.io/sig-storage/nfs-subdir-external-provisioner", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "image", "Tag": "v4.0.2", "Version": "v4.0.2" }, "package_id_70": { "Name": "quay.io/metallb/controller", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "image", "Tag": "v0.15.2", "Version": "v0.15.2" }, "package_id_71": { "Name": "iscsi-initiator-utils", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "package_id_72": { "Name": "device-mapper-multipath", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "package_id_73": { "Name": "sg3_utils", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "package_id_74": { "Name": "lsscsi", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "package_id_75": { "Name": "nvhpc_2025_2511_Linux_x86_64_cuda_13.0", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "tarball", "Sources": [ { "Architecture": "x86_64", "Uri": "https://developer.download.nvidia.com/hpc-sdk/25.11/nvhpc_2025_2511_Linux_x86_64_cuda_13.0.tar.gz" } ] } }, "OSPackages": { "os_package_id_1": { "Name": "which", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_2": { "Name": "tcpdump", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_appstream" }, { "Architecture": "x86_64", "RepoName": "x86_64_appstream" } ] }, "os_package_id_3": { "Name": "traceroute", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_4": { "Name": "iperf3", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_appstream" }, { "Architecture": "x86_64", "RepoName": "x86_64_appstream" } ] }, "os_package_id_5": { "Name": "fping", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "epel" }, { "Architecture": "x86_64", "RepoName": "epel" } ] }, "os_package_id_6": { "Name": "dmidecode", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { 
"Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_7": { "Name": "hwloc", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_8": { "Name": "hwloc-libs", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_9": { "Name": "lshw", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_10": { "Name": "pciutils", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_11": { "Name": "emacs", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_appstream" }, { "Architecture": "x86_64", "RepoName": "x86_64_appstream" } ] }, "os_package_id_12": { "Name": "zsh", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_13": { "Name": "openssh", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_14": { "Name": "openssh-server", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_15": { "Name": "openssh-clients", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_16": { "Name": "rsync", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_17": { "Name": "file", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_18": { "Name": "libcurl", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": 
"x86_64_baseos" } ] }, "os_package_id_19": { "Name": "tar", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_20": { "Name": "bzip2", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_21": { "Name": "man-db", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_22": { "Name": "man-pages", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_23": { "Name": "strace", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_24": { "Name": "kexec-tools", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_25": { "Name": "openssl-devel", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_appstream" }, { "Architecture": "x86_64", "RepoName": "x86_64_appstream" } ] }, "os_package_id_26": { "Name": "ipmitool", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_appstream" }, { "Architecture": "x86_64", "RepoName": "x86_64_appstream" } ] }, "os_package_id_27": { "Name": "gdb", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_appstream" }, { "Architecture": "x86_64", "RepoName": "x86_64_appstream" } ] }, "os_package_id_28": { "Name": "gdb-gdbserver", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_appstream" }, { "Architecture": "x86_64", "RepoName": "x86_64_appstream" } ] }, "os_package_id_29": { "Name": "lldb", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_appstream" }, { "Architecture": "x86_64", "RepoName": "x86_64_appstream" } ] }, "os_package_id_30": { "Name": "lldb-devel", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_appstream" }, { "Architecture": "x86_64", "RepoName": 
"x86_64_appstream" } ] }, "os_package_id_31": { "Name": "valgrind", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_appstream" }, { "Architecture": "x86_64", "RepoName": "x86_64_appstream" } ] }, "os_package_id_32": { "Name": "valgrind-devel", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_appstream" }, { "Architecture": "x86_64", "RepoName": "x86_64_appstream" } ] }, "os_package_id_33": { "Name": "ltrace", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_appstream" }, { "Architecture": "x86_64", "RepoName": "x86_64_appstream" } ] }, "os_package_id_34": { "Name": "kernel-tools", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_35": { "Name": "perf", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_appstream" }, { "Architecture": "x86_64", "RepoName": "x86_64_appstream" } ] }, "os_package_id_36": { "Name": "papi", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_appstream" }, { "Architecture": "x86_64", "RepoName": "x86_64_appstream" } ] }, "os_package_id_37": { "Name": "papi-devel", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_appstream" }, { "Architecture": "x86_64", "RepoName": "x86_64_appstream" } ] }, "os_package_id_38": { "Name": "papi-libs", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_appstream" }, { "Architecture": "x86_64", "RepoName": "x86_64_appstream" } ] }, "os_package_id_39": { "Name": "cmake", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_appstream" }, { "Architecture": "x86_64", "RepoName": "x86_64_appstream" } ] }, "os_package_id_40": { "Name": "make", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_41": { "Name": "autoconf", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_appstream" }, { "Architecture": "x86_64", "RepoName": "x86_64_appstream" } ] }, "os_package_id_42": { "Name": "automake", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_appstream" }, { "Architecture": 
"x86_64", "RepoName": "x86_64_appstream" } ] }, "os_package_id_43": { "Name": "libtool", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_appstream" }, { "Architecture": "x86_64", "RepoName": "x86_64_appstream" } ] }, "os_package_id_44": { "Name": "gcc", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_appstream" }, { "Architecture": "x86_64", "RepoName": "x86_64_appstream" } ] }, "os_package_id_45": { "Name": "gcc-c++", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_appstream" }, { "Architecture": "x86_64", "RepoName": "x86_64_appstream" } ] }, "os_package_id_46": { "Name": "gcc-gfortran", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_appstream" }, { "Architecture": "x86_64", "RepoName": "x86_64_appstream" } ] }, "os_package_id_47": { "Name": "binutils", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_48": { "Name": "binutils-devel", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_appstream" }, { "Architecture": "x86_64", "RepoName": "x86_64_appstream" } ] }, "os_package_id_49": { "Name": "clustershell", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "epel" }, { "Architecture": "x86_64", "RepoName": "epel" } ] }, "os_package_id_50": { "Name": "bash-completion", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_51": { "Name": "systemd", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_52": { "Name": "systemd-udev", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_53": { "Name": "kernel", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_54": { "Name": "dracut", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", 
"RepoName": "x86_64_baseos" } ] }, "os_package_id_55": { "Name": "dracut-live", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_appstream" }, { "Architecture": "x86_64", "RepoName": "x86_64_appstream" } ] }, "os_package_id_56": { "Name": "dracut-network", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_57": { "Name": "squashfs-tools", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_58": { "Name": "nfs-utils", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_59": { "Name": "nfs4-acl-tools", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_60": { "Name": "NetworkManager", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_61": { "Name": "nm-connection-editor", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_appstream" }, { "Architecture": "x86_64", "RepoName": "x86_64_appstream" } ] }, "os_package_id_62": { "Name": "iproute", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_63": { "Name": "iputils", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_64": { "Name": "curl", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_65": { "Name": "bash", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_66": { "Name": "coreutils", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": 
"x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_67": { "Name": "grep", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_68": { "Name": "sed", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_69": { "Name": "gawk", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_70": { "Name": "findutils", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_71": { "Name": "util-linux", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_72": { "Name": "kbd", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_73": { "Name": "lsof", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_74": { "Name": "cryptsetup", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_75": { "Name": "lvm2", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_76": { "Name": "device-mapper", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_77": { "Name": "rsyslog", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_appstream" }, { "Architecture": "x86_64", "RepoName": "x86_64_appstream" } ] }, "os_package_id_78": { "Name": "chrony", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, 
"os_package_id_79": { "Name": "sudo", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_80": { "Name": "gzip", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_81": { "Name": "wget", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_appstream" }, { "Architecture": "x86_64", "RepoName": "x86_64_appstream" } ] }, "os_package_id_82": { "Name": "cloud-init", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_appstream" }, { "Architecture": "x86_64", "RepoName": "x86_64_appstream" } ] }, "os_package_id_83": { "Name": "glibc-langpack-en", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_84": { "Name": "gedit", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "epel" }, { "Architecture": "x86_64", "RepoName": "epel" } ] }, "os_package_id_85": { "Name": "docker.io/dellhpcomniaaisolution/image-build-aarch64", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64" ], "Type": "image", "Tag": "1.1", "Version": "1.1" }, "os_package_id_86": { "Name": "python3-devel", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_appstream" }, { "Architecture": "x86_64", "RepoName": "x86_64_appstream" } ] }, "os_package_id_87": { "Name": "python3-cython", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_codeready-builder" }, { "Architecture": "x86_64", "RepoName": "x86_64_codeready-builder" } ] }, "os_package_id_88": { "Name": "openssl-libs", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_89": { "Name": "ovis-ldms", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_ldms" }, { "Architecture": "x86_64", "RepoName": "x86_64_ldms" } ] }, "os_package_id_90": { "Name": "openldap-clients", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_91": { "Name": "nss-pam-ldapd", "SupportedOS": [ { 
"Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "epel" }, { "Architecture": "x86_64", "RepoName": "epel" } ] }, "os_package_id_92": { "Name": "sssd", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_93": { "Name": "oddjob-mkhomedir", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_appstream" }, { "Architecture": "x86_64", "RepoName": "x86_64_appstream" } ] }, "os_package_id_94": { "Name": "authselect", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "aarch64", "x86_64" ], "Type": "rpm", "Sources": [ { "Architecture": "aarch64", "RepoName": "aarch64_baseos" }, { "Architecture": "x86_64", "RepoName": "x86_64_baseos" } ] }, "os_package_id_95": { "Name": "docker.io/dellhpcomniaaisolution/image-build-el10", "SupportedOS": [ { "Name": "RHEL", "Version": "10.0" } ], "Architecture": [ "x86_64" ], "Type": "image", "Tag": "1.1", "Version": "1.1" } }, "Miscellaneous": [], "InfrastructurePackages": {} } } ================================================ FILE: build_stream/core/catalog/test_fixtures/functional_layer.json ================================================ { "service_kube_control_plane_x86_64": { "packages": [ {"package": "ghcr.io/kube-vip/kube-vip", "type": "image", "tag": "v0.8.9", "architecture": ["x86_64"]}, {"package": "docker.io/alpine/kubectl", "type": "image", "tag": "1.34.1", "architecture": ["x86_64"]}, {"package": "registry.k8s.io/kube-apiserver", "type": "image", "tag": "v1.34.1", "architecture": ["x86_64"]}, {"package": "registry.k8s.io/kube-controller-manager", "type": "image", "tag": "v1.34.1", "architecture": ["x86_64"]}, {"package": "registry.k8s.io/kube-scheduler", "type": "image", "tag": "v1.34.1", "architecture": ["x86_64"]}, {"package": "registry.k8s.io/kube-proxy", "type": "image", "tag": "v1.34.1", "architecture": ["x86_64"]}, {"package": "registry.k8s.io/coredns/coredns", "type": "image", "tag": "v1.12.1", "architecture": ["x86_64"]}, {"package": "registry.k8s.io/pause", "type": "image", "tag": "3.10.1", "architecture": ["x86_64"]}, {"package": "registry.k8s.io/etcd", "type": "image", "tag": "3.6.4-0", "architecture": ["x86_64"]}, {"package": "docker.io/calico/cni", "type": "image", "tag": "v3.30.3", "architecture": ["x86_64"]}, {"package": "docker.io/calico/kube-controllers", "type": "image", "tag": "v3.30.3", "architecture": ["x86_64"]}, {"package": "docker.io/calico/node", "type": "image", "tag": "v3.30.3", "architecture": ["x86_64"]}, {"package": "quay.io/metallb/speaker", "type": "image", "tag": "v0.15.2", "architecture": ["x86_64"]}, {"package": "kubectl-1.34.1", "type": "rpm", "repo_name": "kubernetes", "architecture": ["x86_64"]}, {"package": "prettytable==3.14.0", "type": "pip_module", "architecture": ["x86_64"]}, {"package": "python3.12", "type": "rpm", "repo_name": "x86_64_appstream", "architecture": ["x86_64"]}, {"package": "git", "type": "rpm", "repo_name": "x86_64_appstream", "architecture": ["x86_64"]}, {"package": "kubernetes==33.1.0", "type": "pip_module", "architecture": ["x86_64"]}, {"package": "PyMySQL==1.1.2", "type": "pip_module", "architecture": ["x86_64"]}, {"package": 
"calico-v3.30.3", "type": "manifest", "url": "https://raw.githubusercontent.com/projectcalico/calico/v3.30.3/manifests/calico.yaml", "architecture": ["x86_64"]}, {"package": "metallb-native-v0.15.2", "type": "manifest", "url": "https://raw.githubusercontent.com/metallb/metallb/v0.15.2/config/manifests/metallb-native.yaml", "architecture": ["x86_64"]}, {"package": "helm-v3.19.0-amd64", "type": "tarball", "url": "https://get.helm.sh/helm-v3.19.0-linux-amd64.tar.gz", "architecture": ["x86_64"]}, {"package": "nfs-subdir-external-provisioner-4.0.18", "type": "tarball", "url": "https://github.com/kubernetes-sigs/nfs-subdir-external-provisioner/releases/download/nfs-subdir-external-provisioner-4.0.18/nfs-subdir-external-provisioner-4.0.18.tgz", "architecture": ["x86_64"]} ] }, "service_kube_node_x86_64": { "packages": [ {"package": "registry.k8s.io/sig-storage/nfs-subdir-external-provisioner", "type": "image", "tag": "v4.0.2", "architecture": ["x86_64"]}, {"package": "quay.io/metallb/speaker", "type": "image", "tag": "v0.15.2", "architecture": ["x86_64"]}, {"package": "quay.io/metallb/controller", "type": "image", "tag": "v0.15.2", "architecture": ["x86_64"]} ] }, "login_node_x86_64": { "packages": [ {"package": "slurm-slurmd", "type": "rpm", "repo_name": "x86_64_slurm_custom", "architecture": ["x86_64"]}, {"package": "slurm", "type": "rpm", "repo_name": "x86_64_slurm_custom", "architecture": ["x86_64"]} ] }, "login_node_aarch64": { "packages": [ {"package": "slurm-slurmd", "type": "rpm", "repo_name": "aarch64_slurm_custom", "architecture": ["aarch64"]}, {"package": "slurm", "type": "rpm", "repo_name": "aarch64_slurm_custom", "architecture": ["aarch64"]} ] }, "login_compiler_node_x86_64": { "packages": [ {"package": "slurm", "type": "rpm", "repo_name": "x86_64_slurm_custom", "architecture": ["x86_64"]}, {"package": "slurm-slurmd", "type": "rpm", "repo_name": "x86_64_slurm_custom", "architecture": ["x86_64"]} ] }, "login_compiler_node_aarch64": { "packages": [ {"package": "slurm", "type": "rpm", "repo_name": "aarch64_slurm_custom", "architecture": ["aarch64"]}, {"package": "slurm-slurmd", "type": "rpm", "repo_name": "aarch64_slurm_custom", "architecture": ["aarch64"]} ] }, "slurm_control_node_x86_64": { "packages": [ {"package": "slurm-slurmctld", "type": "rpm", "repo_name": "x86_64_slurm_custom", "architecture": ["x86_64"]}, {"package": "slurm-slurmdbd", "type": "rpm", "repo_name": "x86_64_slurm_custom", "architecture": ["x86_64"]}, {"package": "python3-PyMySQL", "type": "rpm", "repo_name": "x86_64_appstream", "architecture": ["x86_64"]}, {"package": "mariadb-server", "type": "rpm", "repo_name": "x86_64_appstream", "architecture": ["x86_64"]}, {"package": "iscsi-initiator-utils", "type": "rpm", "repo_name": "x86_64_baseos", "architecture": ["x86_64"]}, {"package": "device-mapper-multipath", "type": "rpm", "repo_name": "x86_64_baseos", "architecture": ["x86_64"]}, {"package": "sg3_utils", "type": "rpm", "repo_name": "x86_64_baseos", "architecture": ["x86_64"]}, {"package": "lsscsi", "type": "rpm", "repo_name": "x86_64_baseos", "architecture": ["x86_64"]} ] }, "slurm_node_x86_64": { "packages": [ {"package": "slurm-slurmd", "type": "rpm", "repo_name": "x86_64_slurm_custom", "architecture": ["x86_64"]}, {"package": "slurm-pam_slurm", "type": "rpm", "repo_name": "x86_64_slurm_custom", "architecture": ["x86_64"]}, {"package": "kernel-devel", "type": "rpm", "repo_name": "x86_64_appstream", "architecture": ["x86_64"]}, {"package": "kernel-headers", "type": "rpm", "repo_name": "x86_64_appstream", 
"architecture": ["x86_64"]}, {"package": "cuda-run", "type": "iso", "url": "https://developer.download.nvidia.com/compute/cuda/13.0.2/local_installers/cuda_13.0.2_580.95.05_linux.run", "architecture": ["x86_64"]} ] }, "slurm_node_aarch64": { "packages": [ {"package": "slurm-slurmd", "type": "rpm", "repo_name": "aarch64_slurm_custom", "architecture": ["aarch64"]}, {"package": "slurm-pam_slurm", "type": "rpm", "repo_name": "aarch64_slurm_custom", "architecture": ["aarch64"]}, {"package": "kernel-devel", "type": "rpm", "repo_name": "aarch64_appstream", "architecture": ["aarch64"]}, {"package": "kernel-headers", "type": "rpm", "repo_name": "aarch64_appstream", "architecture": ["aarch64"]}, {"package": "cuda-run", "type": "iso", "url": "https://developer.download.nvidia.com/compute/cuda/13.0.2/local_installers/cuda_13.0.2_580.95.05_linux_sbsa.run", "architecture": ["aarch64"]} ] } } ================================================ FILE: build_stream/core/catalog/tests/sample.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Example script showing programmatic usage of the generator and adapter APIs. This script runs the catalog feature-list generator and adapter config generator directly from Python, configuring logging and handling common errors. 
""" import logging import os from catalog_parser.generator import generate_root_json_from_catalog, get_functional_layer_roles_from_file, get_package_list from catalog_parser.adapter import generate_omnia_json_from_catalog from catalog_parser.adapter_policy import generate_configs_from_policy BASE_DIR = os.path.dirname(os.path.dirname(__file__)) CATALOG_PARSER_DIR = os.path.join(BASE_DIR, "") CATALOG_PATH = os.path.join(CATALOG_PARSER_DIR, "test_fixtures", "catalog_rhel.json") SCHEMA_PATH = os.path.join(CATALOG_PARSER_DIR, "resources", "CatalogSchema.json") FUNCTIONAL_LAYER_PATH = os.path.join(CATALOG_PARSER_DIR, "test_fixtures", "functional_layer.json") ADAPTER_POLICY_PATH = os.path.join(CATALOG_PARSER_DIR, "resources", "adapter_policy_default.json") ADAPTER_POLICY_SCHEMA_PATH = os.path.join(CATALOG_PARSER_DIR, "resources", "AdapterPolicySchema.json") try: generate_root_json_from_catalog( catalog_path=CATALOG_PATH, schema_path=SCHEMA_PATH, output_root="out/generator2", configure_logging=True, log_file="logs/generator.log", log_level=logging.INFO, ) generate_omnia_json_from_catalog( catalog_path=CATALOG_PATH, schema_path=SCHEMA_PATH, output_root="out/adapter/config2", configure_logging=True, log_file="logs/adapter.log", log_level=logging.INFO, ) generate_configs_from_policy( input_dir="out/generator2", output_dir="out/adapter_policy/config2", policy_path=ADAPTER_POLICY_PATH, schema_path=ADAPTER_POLICY_SCHEMA_PATH, configure_logging=True, log_file="logs/adapter_policy.log", log_level=logging.INFO, ) roles = get_functional_layer_roles_from_file(FUNCTIONAL_LAYER_PATH) print(f"Functional layer roles: {roles}") # Get packages for a specific role result = get_package_list(FUNCTIONAL_LAYER_PATH, role="K8S Controller") print(f"Packages for role 'K8S Controller': {result}") # Get packages for all roles result = get_package_list(FUNCTIONAL_LAYER_PATH) print(f"Packages for all roles: {result}") except FileNotFoundError as e: # handle missing catalog/schema print(f"Missing file: {e}") except Exception as e: # handle generic processing errors print(f"Processing failed: {e}") ================================================ FILE: build_stream/core/catalog/tests/test_adapter_cli_defaults.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
import os import sys import tempfile import unittest HERE = os.path.dirname(__file__) CATALOG_PARSER_DIR = os.path.dirname(HERE) PROJECT_ROOT = os.path.dirname(CATALOG_PARSER_DIR) if PROJECT_ROOT not in sys.path: sys.path.insert(0, PROJECT_ROOT) from catalog_parser.adapter import generate_omnia_json_from_catalog, _DEFAULT_SCHEMA_PATH class TestAdapterDefaults(unittest.TestCase): def test_default_schema_path_points_to_resources(self): catalog_parser_dir = os.path.dirname(os.path.dirname(__file__)) expected_schema = os.path.join(catalog_parser_dir, "resources", "CatalogSchema.json") self.assertEqual(os.path.abspath(_DEFAULT_SCHEMA_PATH), os.path.abspath(expected_schema)) def test_generate_omnia_json_with_defaults_writes_output(self): catalog_parser_dir = os.path.dirname(os.path.dirname(__file__)) catalog_path = os.path.join(catalog_parser_dir, "test_fixtures", "catalog_rhel.json") with tempfile.TemporaryDirectory() as tmpdir: generate_omnia_json_from_catalog( catalog_path=catalog_path, output_root=tmpdir, ) # We expect some JSON files under arch/os/version found_any_json = False for root, dirs, files in os.walk(tmpdir): if any(f.endswith('.json') for f in files): found_any_json = True break self.assertTrue(found_any_json, "No JSON configs generated under any arch/os/version") if __name__ == "__main__": unittest.main() ================================================ FILE: build_stream/core/catalog/tests/test_adapter_policy.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
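# A minimal adapter-policy sketch, mirroring the shape the fixtures below use
# (a "version" plus a "targets" map of output files to source pulls); illustrative only:
#
#     {
#         "version": "2.0.0",
#         "targets": {
#             "test.json": {
#                 "sources": [
#                     {"source_file": "source.json", "pulls": [{"source_key": "role1"}]}
#                 ]
#             }
#         }
#     }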
"""Unit tests for adapter_policy module.""" import json import os import sys import tempfile import unittest HERE = os.path.dirname(__file__) CATALOG_PARSER_DIR = os.path.dirname(HERE) PROJECT_ROOT = os.path.dirname(CATALOG_PARSER_DIR) if PROJECT_ROOT not in sys.path: sys.path.insert(0, PROJECT_ROOT) from catalog_parser.adapter_policy import ( validate_policy_config, discover_architectures, discover_os_versions, transform_package, apply_substring_filter, compute_common_packages, apply_extract_common_filter, apply_extract_unique_filter, apply_filter, merge_transform, compute_common_keys_from_roles, derive_common_role, check_conditions, process_target_spec, write_config_file, generate_configs_from_policy, _DEFAULT_POLICY_PATH, _DEFAULT_SCHEMA_PATH, ) from catalog_parser import adapter_policy_schema_consts as schema class TestValidatePolicyConfig(unittest.TestCase): """Tests for validate_policy_config function.""" def setUp(self): self.valid_policy = { "version": "2.0.0", "targets": { "test.json": { "sources": [ { "source_file": "source.json", "pulls": [{"source_key": "role1"}] } ] } } } self.schema_path = _DEFAULT_SCHEMA_PATH with open(self.schema_path, "r", encoding="utf-8") as f: self.schema_config = json.load(f) def test_valid_policy_passes_validation(self): """Valid policy should not raise any exception.""" validate_policy_config( self.valid_policy, self.schema_config, policy_path="test_policy.json", schema_path=self.schema_path ) def test_missing_version_raises_error(self): """Policy missing required 'version' field should raise ValueError.""" invalid_policy = {"targets": {}} with self.assertRaises(ValueError) as ctx: validate_policy_config( invalid_policy, self.schema_config, policy_path="test_policy.json", schema_path=self.schema_path ) self.assertIn("Adapter policy validation failed", str(ctx.exception)) self.assertIn("version", str(ctx.exception)) def test_missing_targets_raises_error(self): """Policy missing required 'targets' field should raise ValueError.""" invalid_policy = {"version": "2.0.0"} with self.assertRaises(ValueError) as ctx: validate_policy_config( invalid_policy, self.schema_config, policy_path="test_policy.json", schema_path=self.schema_path ) self.assertIn("Adapter policy validation failed", str(ctx.exception)) self.assertIn("targets", str(ctx.exception)) def test_invalid_target_spec_raises_error(self): """Target spec missing 'sources' should raise ValueError.""" invalid_policy = { "version": "2.0.0", "targets": { "test.json": {} } } with self.assertRaises(ValueError) as ctx: validate_policy_config( invalid_policy, self.schema_config, policy_path="test_policy.json", schema_path=self.schema_path ) self.assertIn("Adapter policy validation failed", str(ctx.exception)) def test_allowlist_filter_policy_validates(self): """Policy using allowlist filter type should validate against schema.""" policy = { "version": "2.0.0", "targets": { "openldap.json": { "sources": [ { "source_file": "base_os.json", "pulls": [ { "source_key": "Base OS", "filter": { "type": "allowlist", "field": "package", "values": ["openldap-clients"], "case_sensitive": False, }, } ], } ] } }, } validate_policy_config( policy, self.schema_config, policy_path="test_policy.json", schema_path=self.schema_path, ) def test_field_in_filter_policy_validates(self): """Policy using field_in filter type should validate against schema.""" policy = { "version": "2.0.0", "targets": { "openldap.json": { "sources": [ { "source_file": "base_os.json", "pulls": [ { "source_key": "Base OS", "filter": { "type": "field_in", 
"field": "feature", "values": ["openldap"], "case_sensitive": False, }, } ], } ] } }, } validate_policy_config( policy, self.schema_config, policy_path="test_policy.json", schema_path=self.schema_path, ) def test_any_of_filter_requires_filters(self): """any_of filter must define nested filters.""" policy = { "version": "2.0.0", "targets": { "openldap.json": { "sources": [ { "source_file": "base_os.json", "pulls": [ {"source_key": "Base OS", "filter": {"type": "any_of"}} ], } ] } }, } with self.assertRaises(ValueError) as ctx: validate_policy_config( policy, self.schema_config, policy_path="test_policy.json", schema_path=self.schema_path, ) self.assertIn("Adapter policy validation failed", str(ctx.exception)) def test_any_of_filter_policy_validates(self): """Policy using any_of filter type should validate against schema.""" policy = { "version": "2.0.0", "targets": { "openldap.json": { "sources": [ { "source_file": "base_os.json", "pulls": [ { "source_key": "Base OS", "filter": { "type": "any_of", "filters": [ {"type": "substring", "values": ["ldap"]}, {"type": "field_in", "field": "feature", "values": ["openldap"]}, ], }, } ], } ] } }, } validate_policy_config( policy, self.schema_config, policy_path="test_policy.json", schema_path=self.schema_path, ) class TestDiscoverArchitectures(unittest.TestCase): """Tests for discover_architectures function.""" def test_discovers_architecture_directories(self): """Should return list of subdirectory names.""" with tempfile.TemporaryDirectory() as tmpdir: os.makedirs(os.path.join(tmpdir, "x86_64")) os.makedirs(os.path.join(tmpdir, "aarch64")) # Create a file (should be ignored) with open(os.path.join(tmpdir, "readme.txt"), "w") as f: f.write("test") archs = discover_architectures(tmpdir) self.assertEqual(sorted(archs), ["aarch64", "x86_64"]) def test_returns_empty_for_nonexistent_dir(self): """Should return empty list for non-existent directory.""" archs = discover_architectures("/nonexistent/path") self.assertEqual(archs, []) def test_returns_empty_for_empty_dir(self): """Should return empty list for empty directory.""" with tempfile.TemporaryDirectory() as tmpdir: archs = discover_architectures(tmpdir) self.assertEqual(archs, []) class TestDiscoverOsVersions(unittest.TestCase): """Tests for discover_os_versions function.""" def test_discovers_os_and_versions(self): """Should return list of (os_family, version) tuples.""" with tempfile.TemporaryDirectory() as tmpdir: os.makedirs(os.path.join(tmpdir, "x86_64", "rhel", "9.0")) os.makedirs(os.path.join(tmpdir, "x86_64", "rhel", "8.0")) os.makedirs(os.path.join(tmpdir, "x86_64", "ubuntu", "22.04")) results = discover_os_versions(tmpdir, "x86_64") self.assertEqual(len(results), 3) self.assertIn(("rhel", "9.0"), results) self.assertIn(("rhel", "8.0"), results) self.assertIn(("ubuntu", "22.04"), results) def test_returns_empty_for_nonexistent_arch(self): """Should return empty list for non-existent architecture.""" with tempfile.TemporaryDirectory() as tmpdir: results = discover_os_versions(tmpdir, "nonexistent") self.assertEqual(results, []) class TestTransformPackage(unittest.TestCase): """Tests for transform_package function.""" def test_no_transform_returns_copy(self): """No transform config should return a copy of the package.""" pkg = {"name": "test", "version": "1.0"} result = transform_package(pkg, None) self.assertEqual(result, pkg) self.assertIsNot(result, pkg) def test_exclude_fields(self): """Should exclude specified fields.""" pkg = {"name": "test", "version": "1.0", "architecture": "x86_64"} 
transform = {schema.EXCLUDE_FIELDS: ["architecture"]} result = transform_package(pkg, transform) self.assertEqual(result, {"name": "test", "version": "1.0"}) def test_rename_fields(self): """Should rename specified fields.""" pkg = {"name": "test", "ver": "1.0"} transform = {schema.RENAME_FIELDS: {"ver": "version"}} result = transform_package(pkg, transform) self.assertEqual(result, {"name": "test", "version": "1.0"}) def test_exclude_and_rename_combined(self): """Should apply both exclude and rename.""" pkg = {"name": "test", "ver": "1.0", "arch": "x86_64"} transform = { schema.EXCLUDE_FIELDS: ["arch"], schema.RENAME_FIELDS: {"ver": "version"} } result = transform_package(pkg, transform) self.assertEqual(result, {"name": "test", "version": "1.0"}) class TestApplySubstringFilter(unittest.TestCase): """Tests for apply_substring_filter function.""" def test_filters_by_substring(self): """Should filter packages by substring match.""" packages = [ {"package": "kubernetes-client"}, {"package": "kubernetes-server"}, {"package": "docker-ce"}, ] filter_config = { schema.FIELD: "package", schema.VALUES: ["kubernetes"] } result = apply_substring_filter(packages, filter_config) self.assertEqual(len(result), 2) self.assertTrue(all("kubernetes" in p["package"] for p in result)) def test_case_insensitive_by_default(self): """Should be case-insensitive by default.""" packages = [ {"package": "Kubernetes-Client"}, {"package": "docker-ce"}, ] filter_config = { schema.FIELD: "package", schema.VALUES: ["kubernetes"] } result = apply_substring_filter(packages, filter_config) self.assertEqual(len(result), 1) def test_case_sensitive_when_specified(self): """Should be case-sensitive when specified.""" packages = [ {"package": "Kubernetes-Client"}, {"package": "kubernetes-server"}, ] filter_config = { schema.FIELD: "package", schema.VALUES: ["kubernetes"], schema.CASE_SENSITIVE: True } result = apply_substring_filter(packages, filter_config) self.assertEqual(len(result), 1) self.assertEqual(result[0]["package"], "kubernetes-server") def test_empty_values_returns_all(self): """Empty values list should return all packages.""" packages = [{"package": "test1"}, {"package": "test2"}] filter_config = {schema.FIELD: "package", schema.VALUES: []} result = apply_substring_filter(packages, filter_config) self.assertEqual(result, packages) class TestAllowlistAndFieldFilters(unittest.TestCase): def test_allowlist_matches_exact_package_names(self): packages = [ {"package": "openldap-clients"}, {"package": "openldap-servers"}, {"package": "openmpi"}, ] filter_config = { schema.TYPE: schema.ALLOWLIST_FILTER, schema.FIELD: "package", schema.VALUES: ["openldap-clients"], schema.CASE_SENSITIVE: False, } result = apply_filter(packages, {}, "Base OS", filter_config) self.assertEqual([p["package"] for p in result], ["openldap-clients"]) def test_field_in_matches_classification_field(self): packages = [ {"package": "vendor-ldap", "feature": "openldap"}, {"package": "vendor-ldap2", "feature": "other"}, {"package": "no-feature"}, ] filter_config = { schema.TYPE: schema.FIELD_IN_FILTER, schema.FIELD: "feature", schema.VALUES: ["openldap"], schema.CASE_SENSITIVE: False, } result = apply_filter(packages, {}, "Base OS", filter_config) self.assertEqual([p["package"] for p in result], ["vendor-ldap"]) def test_any_of_combines_multiple_strategies(self): packages = [ {"package": "openldap-clients"}, {"package": "vendor-ldap", "feature": "openldap"}, {"package": "slapd-utils"}, {"package": "unrelated"}, ] filter_config = { schema.TYPE: 
schema.ANY_OF_FILTER, schema.FILTERS: [ { schema.TYPE: schema.ALLOWLIST_FILTER, schema.FIELD: "package", schema.VALUES: ["openldap-clients"], schema.CASE_SENSITIVE: False, }, { schema.TYPE: schema.FIELD_IN_FILTER, schema.FIELD: "feature", schema.VALUES: ["openldap"], schema.CASE_SENSITIVE: False, }, { schema.TYPE: schema.SUBSTRING_FILTER, schema.FIELD: "package", schema.VALUES: ["slapd"], schema.CASE_SENSITIVE: False, }, ], } result = apply_filter(packages, {}, "Base OS", filter_config) self.assertEqual( [p["package"] for p in result], ["openldap-clients", "vendor-ldap", "slapd-utils"], ) class TestComputeCommonPackages(unittest.TestCase): """Tests for compute_common_packages function.""" def test_finds_common_packages(self): """Should find packages common across multiple keys.""" source_data = { "role1": {schema.PACKAGES: [ {"name": "common-pkg", "version": "1.0"}, {"name": "unique1", "version": "1.0"}, ]}, "role2": {schema.PACKAGES: [ {"name": "common-pkg", "version": "1.0"}, {"name": "unique2", "version": "1.0"}, ]}, } common_keys, key_to_pkg = compute_common_packages( source_data, ["role1", "role2"], min_occurrences=2 ) self.assertEqual(len(common_keys), 1) def test_respects_min_occurrences(self): """Should respect min_occurrences threshold.""" source_data = { "role1": {schema.PACKAGES: [{"name": "pkg1"}]}, "role2": {schema.PACKAGES: [{"name": "pkg1"}]}, "role3": {schema.PACKAGES: [{"name": "pkg2"}]}, } common_keys, _ = compute_common_packages( source_data, ["role1", "role2", "role3"], min_occurrences=3 ) self.assertEqual(len(common_keys), 0) class TestMergeTransform(unittest.TestCase): """Tests for merge_transform function.""" def test_none_inputs_return_none(self): """Both None should return None.""" self.assertIsNone(merge_transform(None, None)) def test_base_only(self): """Only base should return base.""" base = {schema.EXCLUDE_FIELDS: ["arch"]} self.assertEqual(merge_transform(base, None), base) def test_override_only(self): """Only override should return override.""" override = {schema.EXCLUDE_FIELDS: ["arch"]} self.assertEqual(merge_transform(None, override), override) def test_override_wins(self): """Override values should win.""" base = {schema.EXCLUDE_FIELDS: ["arch"]} override = {schema.EXCLUDE_FIELDS: ["version"]} result = merge_transform(base, override) self.assertEqual(result[schema.EXCLUDE_FIELDS], ["version"]) class TestCheckConditions(unittest.TestCase): """Tests for check_conditions function.""" def test_no_conditions_returns_true(self): """No conditions should always return True.""" self.assertTrue(check_conditions(None, "x86_64", "rhel", "9.0")) def test_architecture_condition(self): """Should check architecture condition.""" conditions = {schema.ARCHITECTURES: ["x86_64"]} self.assertTrue(check_conditions(conditions, "x86_64", "rhel", "9.0")) self.assertFalse(check_conditions(conditions, "aarch64", "rhel", "9.0")) def test_os_family_condition(self): """Should check OS family condition.""" conditions = {schema.OS_FAMILIES: ["rhel"]} self.assertTrue(check_conditions(conditions, "x86_64", "rhel", "9.0")) self.assertFalse(check_conditions(conditions, "x86_64", "ubuntu", "22.04")) def test_os_version_condition(self): """Should check OS version condition.""" conditions = {schema.OS_VERSIONS: ["9.0"]} self.assertTrue(check_conditions(conditions, "x86_64", "rhel", "9.0")) self.assertFalse(check_conditions(conditions, "x86_64", "rhel", "8.0")) def test_multiple_conditions_all_must_pass(self): """All conditions must pass.""" conditions = { schema.ARCHITECTURES: ["x86_64"], 
schema.OS_FAMILIES: ["rhel"], schema.OS_VERSIONS: ["9.0"] } self.assertTrue(check_conditions(conditions, "x86_64", "rhel", "9.0")) self.assertFalse(check_conditions(conditions, "aarch64", "rhel", "9.0")) class TestDeriveCommonRole(unittest.TestCase): """Tests for derive_common_role function.""" def test_derives_common_packages(self): """Should derive common packages into new role.""" target_roles = { "role1": [{"name": "common"}, {"name": "unique1"}], "role2": [{"name": "common"}, {"name": "unique2"}], } derive_common_role( target_roles, derived_key="common_role", from_keys=["role1", "role2"], min_occurrences=2, remove_from_sources=True ) self.assertIn("common_role", target_roles) self.assertEqual(len(target_roles["common_role"]), 1) self.assertEqual(target_roles["common_role"][0]["name"], "common") def test_removes_from_sources_when_specified(self): """Should remove common packages from source roles.""" target_roles = { "role1": [{"name": "common"}, {"name": "unique1"}], "role2": [{"name": "common"}, {"name": "unique2"}], } derive_common_role( target_roles, derived_key="common_role", from_keys=["role1", "role2"], min_occurrences=2, remove_from_sources=True ) self.assertEqual(len(target_roles["role1"]), 1) self.assertEqual(target_roles["role1"][0]["name"], "unique1") def test_keeps_sources_when_not_removing(self): """Should keep source packages when remove_from_sources=False.""" target_roles = { "role1": [{"name": "common"}, {"name": "unique1"}], "role2": [{"name": "common"}, {"name": "unique2"}], } derive_common_role( target_roles, derived_key="common_role", from_keys=["role1", "role2"], min_occurrences=2, remove_from_sources=False ) self.assertEqual(len(target_roles["role1"]), 2) class TestWriteConfigFile(unittest.TestCase): """Tests for write_config_file function.""" def test_writes_valid_json(self): """Should write valid JSON file.""" with tempfile.TemporaryDirectory() as tmpdir: file_path = os.path.join(tmpdir, "subdir", "test.json") config = { "role1": {schema.CLUSTER: [{"name": "pkg1"}]}, "role2": {schema.CLUSTER: [{"name": "pkg2"}]}, } write_config_file(file_path, config) self.assertTrue(os.path.exists(file_path)) with open(file_path, "r", encoding="utf-8") as f: loaded = json.load(f) self.assertEqual(loaded["role1"][schema.CLUSTER][0]["name"], "pkg1") def test_creates_parent_directories(self): """Should create parent directories if they don't exist.""" with tempfile.TemporaryDirectory() as tmpdir: file_path = os.path.join(tmpdir, "a", "b", "c", "test.json") config = {"role1": {schema.CLUSTER: []}} write_config_file(file_path, config) self.assertTrue(os.path.exists(file_path)) class TestGenerateConfigsFromPolicy(unittest.TestCase): """Tests for generate_configs_from_policy function.""" def setUp(self): self.test_fixtures_dir = os.path.join(CATALOG_PARSER_DIR, "test_fixtures") self.test_policy_path = os.path.join(self.test_fixtures_dir, "adapter_policy_test.json") def test_generates_output_files(self): """Should generate output JSON files from valid policy.""" with tempfile.TemporaryDirectory() as tmpdir: # Create input directory structure input_dir = os.path.join(tmpdir, "input") output_dir = os.path.join(tmpdir, "output") os.makedirs(os.path.join(input_dir, "x86_64", "rhel", "9.0")) # Create source file source_data = { "Base OS": { schema.PACKAGES: [ {"package": "test-pkg", "version": "1.0"} ] } } with open(os.path.join(input_dir, "x86_64", "rhel", "9.0", "base_os.json"), "w") as f: json.dump(source_data, f) # Create minimal policy policy = { "version": "2.0.0", "targets": { 
"output.json": { "sources": [{ "source_file": "base_os.json", "pulls": [{"source_key": "Base OS", "target_key": "base_role"}] }] } } } policy_path = os.path.join(tmpdir, "policy.json") with open(policy_path, "w") as f: json.dump(policy, f) generate_configs_from_policy( input_dir=input_dir, output_dir=output_dir, policy_path=policy_path, schema_path=_DEFAULT_SCHEMA_PATH ) output_file = os.path.join(output_dir, "x86_64", "rhel", "9.0", "output.json") self.assertTrue(os.path.exists(output_file)) def test_generates_openldap_with_any_of_filter(self): with tempfile.TemporaryDirectory() as tmpdir: input_dir = os.path.join(tmpdir, "input") output_dir = os.path.join(tmpdir, "output") os.makedirs(os.path.join(input_dir, "x86_64", "rhel", "9.0")) source_data = { "Base OS": { schema.PACKAGES: [ {"package": "openldap-clients", "type": "rpm", "architecture": ["x86_64"]}, {"package": "vendor-directory-client", "type": "rpm", "architecture": ["x86_64"], "feature": "openldap"}, {"package": "slapd-utils", "type": "rpm", "architecture": ["x86_64"]}, {"package": "bash", "type": "rpm", "architecture": ["x86_64"]}, ] } } with open(os.path.join(input_dir, "x86_64", "rhel", "9.0", "base_os.json"), "w") as f: json.dump(source_data, f) policy = { "version": "2.0.0", "targets": { "openldap.json": { "transform": {"exclude_fields": ["architecture"]}, "sources": [ { "source_file": "base_os.json", "pulls": [ { "source_key": "Base OS", "target_key": "openldap", "filter": { "type": "any_of", "filters": [ {"type": "allowlist", "field": "package", "values": ["openldap-clients"], "case_sensitive": False}, {"type": "field_in", "field": "feature", "values": ["openldap"], "case_sensitive": False}, {"type": "substring", "field": "package", "values": ["slapd"], "case_sensitive": False}, ], }, } ], } ], } }, } policy_path = os.path.join(tmpdir, "policy.json") with open(policy_path, "w") as f: json.dump(policy, f) generate_configs_from_policy( input_dir=input_dir, output_dir=output_dir, policy_path=policy_path, schema_path=_DEFAULT_SCHEMA_PATH, ) output_file = os.path.join(output_dir, "x86_64", "rhel", "9.0", "openldap.json") self.assertTrue(os.path.exists(output_file)) with open(output_file, "r", encoding="utf-8") as f: out_json = json.load(f) self.assertIn("openldap", out_json) pkgs = out_json["openldap"][schema.CLUSTER] self.assertEqual( [p.get("package") for p in pkgs], ["openldap-clients", "vendor-directory-client", "slapd-utils"], ) self.assertTrue(all("architecture" not in p for p in pkgs)) def test_invalid_policy_raises_error(self): """Should raise ValueError for invalid policy.""" with tempfile.TemporaryDirectory() as tmpdir: input_dir = os.path.join(tmpdir, "input") output_dir = os.path.join(tmpdir, "output") os.makedirs(input_dir) # Create invalid policy (missing version) invalid_policy = {"targets": {}} policy_path = os.path.join(tmpdir, "invalid_policy.json") with open(policy_path, "w") as f: json.dump(invalid_policy, f) with self.assertRaises(ValueError) as ctx: generate_configs_from_policy( input_dir=input_dir, output_dir=output_dir, policy_path=policy_path, schema_path=_DEFAULT_SCHEMA_PATH ) self.assertIn("Adapter policy validation failed", str(ctx.exception)) def test_missing_input_dir_raises_file_not_found(self): """Should raise FileNotFoundError if input_dir does not exist.""" with tempfile.TemporaryDirectory() as tmpdir: output_dir = os.path.join(tmpdir, "output") missing_input_dir = os.path.join(tmpdir, "does_not_exist") with self.assertRaises(FileNotFoundError): generate_configs_from_policy( 
input_dir=missing_input_dir, output_dir=output_dir, policy_path=_DEFAULT_POLICY_PATH, schema_path=_DEFAULT_SCHEMA_PATH, ) def test_missing_policy_file_raises_file_not_found(self): """Should raise FileNotFoundError if policy_path does not exist.""" with tempfile.TemporaryDirectory() as tmpdir: input_dir = os.path.join(tmpdir, "input") output_dir = os.path.join(tmpdir, "output") os.makedirs(input_dir) missing_policy_path = os.path.join(tmpdir, "missing_policy.json") with self.assertRaises(FileNotFoundError): generate_configs_from_policy( input_dir=input_dir, output_dir=output_dir, policy_path=missing_policy_path, schema_path=_DEFAULT_SCHEMA_PATH, ) def test_missing_schema_file_raises_file_not_found(self): """Should raise FileNotFoundError if schema_path does not exist.""" with tempfile.TemporaryDirectory() as tmpdir: input_dir = os.path.join(tmpdir, "input") output_dir = os.path.join(tmpdir, "output") os.makedirs(input_dir) missing_schema_path = os.path.join(tmpdir, "missing_schema.json") with self.assertRaises(FileNotFoundError): generate_configs_from_policy( input_dir=input_dir, output_dir=output_dir, policy_path=_DEFAULT_POLICY_PATH, schema_path=missing_schema_path, ) class TestDefaultPaths(unittest.TestCase): """Tests for default path constants.""" def test_default_policy_path_exists(self): """Default policy path should point to existing file.""" self.assertTrue( os.path.exists(_DEFAULT_POLICY_PATH), f"Default policy file not found: {_DEFAULT_POLICY_PATH}" ) def test_default_schema_path_exists(self): """Default schema path should point to existing file.""" self.assertTrue( os.path.exists(_DEFAULT_SCHEMA_PATH), f"Default schema file not found: {_DEFAULT_SCHEMA_PATH}" ) def test_default_policy_validates_against_schema(self): """Default policy should validate against default schema.""" with open(_DEFAULT_POLICY_PATH, "r", encoding="utf-8") as f: policy = json.load(f) with open(_DEFAULT_SCHEMA_PATH, "r", encoding="utf-8") as f: schema_config = json.load(f) # Should not raise validate_policy_config( policy, schema_config, policy_path=_DEFAULT_POLICY_PATH, schema_path=_DEFAULT_SCHEMA_PATH ) class TestProcessTargetSpec(unittest.TestCase): """Tests for process_target_spec function.""" def test_processes_simple_target(self): """Should process a simple target specification.""" source_files = { "source.json": { "role1": {schema.PACKAGES: [{"name": "pkg1"}]} } } target_spec = { "sources": [{ "source_file": "source.json", "pulls": [{"source_key": "role1", "target_key": "output_role"}] }] } target_configs = {} process_target_spec( target_file="output.json", target_spec=target_spec, source_files=source_files, target_configs=target_configs, arch="x86_64", os_family="rhel", os_version="9.0" ) self.assertIn("output.json", target_configs) self.assertIn("output_role", target_configs["output.json"]) def test_skips_when_conditions_not_met(self): """Should skip target when conditions are not met.""" source_files = {"source.json": {"role1": {schema.PACKAGES: []}}} target_spec = { "conditions": {schema.ARCHITECTURES: ["aarch64"]}, "sources": [{ "source_file": "source.json", "pulls": [{"source_key": "role1"}] }] } target_configs = {} process_target_spec( target_file="output.json", target_spec=target_spec, source_files=source_files, target_configs=target_configs, arch="x86_64", os_family="rhel", os_version="9.0" ) self.assertNotIn("output.json", target_configs) def test_applies_transform(self): """Should apply transform to packages.""" source_files = { "source.json": { "role1": {schema.PACKAGES: [ {"name": "pkg1", 
"architecture": "x86_64"} ]} } } target_spec = { "transform": {schema.EXCLUDE_FIELDS: ["architecture"]}, "sources": [{ "source_file": "source.json", "pulls": [{"source_key": "role1", "target_key": "output_role"}] }] } target_configs = {} process_target_spec( target_file="output.json", target_spec=target_spec, source_files=source_files, target_configs=target_configs, arch="x86_64", os_family="rhel", os_version="9.0" ) pkgs = target_configs["output.json"]["output_role"][schema.CLUSTER] self.assertNotIn("architecture", pkgs[0]) if __name__ == "__main__": unittest.main() ================================================ FILE: build_stream/core/catalog/tests/test_generator_cli_defaults.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. import os import sys import tempfile import unittest HERE = os.path.dirname(__file__) CATALOG_PARSER_DIR = os.path.dirname(HERE) PROJECT_ROOT = os.path.dirname(CATALOG_PARSER_DIR) if PROJECT_ROOT not in sys.path: sys.path.insert(0, PROJECT_ROOT) from catalog_parser.generator import generate_root_json_from_catalog, _DEFAULT_SCHEMA_PATH class TestGeneratorDefaults(unittest.TestCase): def test_default_schema_path_points_to_resources(self): catalog_parser_dir = os.path.dirname(os.path.dirname(__file__)) expected_schema = os.path.join(catalog_parser_dir, "resources", "CatalogSchema.json") self.assertEqual(os.path.abspath(_DEFAULT_SCHEMA_PATH), os.path.abspath(expected_schema)) def test_generate_root_json_with_defaults_writes_output(self): catalog_parser_dir = os.path.dirname(os.path.dirname(__file__)) catalog_path = os.path.join(catalog_parser_dir, "test_fixtures", "catalog_rhel.json") with tempfile.TemporaryDirectory() as tmpdir: generate_root_json_from_catalog( catalog_path=catalog_path, output_root=tmpdir, ) # We expect at least one arch/os/version directory with functional_layer.json found = False for root, dirs, files in os.walk(tmpdir): if "functional_layer.json" in files: found = True break self.assertTrue(found, "functional_layer.json not generated under any arch/os/version") if __name__ == "__main__": unittest.main() ================================================ FILE: build_stream/core/catalog/tests/test_generator_package_list.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
"""Unit tests for get_package_list function in generator module.""" import json import os import sys import tempfile import unittest from jsonschema import ValidationError HERE = os.path.dirname(__file__) CATALOG_PARSER_DIR = os.path.dirname(HERE) PROJECT_ROOT = os.path.dirname(CATALOG_PARSER_DIR) if PROJECT_ROOT not in sys.path: sys.path.insert(0, PROJECT_ROOT) from catalog_parser.generator import ( FeatureList, serialize_json, get_package_list, ) class TestGetPackageList(unittest.TestCase): """Tests for get_package_list function.""" def setUp(self): """Set up test fixtures.""" self.base_dir = os.path.dirname(__file__) self.fixture_path = os.path.abspath( os.path.join(self.base_dir, "..", "test_fixtures", "functional_layer.json") ) def test_get_packages_for_valid_single_role(self): """TC01: Given a valid role, returns list with one role object containing packages.""" result = get_package_list(self.fixture_path, role="Compiler") self.assertIsInstance(result, list) self.assertEqual(len(result), 1) self.assertEqual(result[0]["roleName"], "Compiler") self.assertIn("packages", result[0]) self.assertIsInstance(result[0]["packages"], list) self.assertGreater(len(result[0]["packages"]), 0) def test_get_packages_for_all_roles_when_role_is_none(self): """TC02: When role is None, returns list with all role objects.""" result = get_package_list(self.fixture_path, role=None) self.assertIsInstance(result, list) # Fixture has 6 roles expected_roles = [ "Compiler", "K8S Controller", "K8S Worker", "Login Node", "Slurm Controller", "Slurm Worker", ] actual_roles = [r["roleName"] for r in result] self.assertCountEqual(actual_roles, expected_roles) def test_invalid_role_raises_value_error(self): """TC03: Invalid/unknown role raises ValueError with clear message.""" with self.assertRaises(ValueError) as context: get_package_list(self.fixture_path, role="NonExistentRole") self.assertIn("NonExistentRole", str(context.exception)) def test_empty_role_raises_value_error(self): """Empty role string is treated as invalid input.""" with self.assertRaises(ValueError) as context: get_package_list(self.fixture_path, role="") self.assertIn("non-empty", str(context.exception)) def test_file_not_found_raises_error(self): """TC04: Non-existent file raises FileNotFoundError.""" with self.assertRaises(FileNotFoundError): get_package_list("/nonexistent/path/functional_layer.json") def test_malformed_json_raises_error(self): """TC05: Malformed JSON raises json.JSONDecodeError.""" with tempfile.TemporaryDirectory() as tmp_dir: malformed_path = os.path.join(tmp_dir, "malformed.json") with open(malformed_path, "w", encoding="utf-8") as f: f.write("{ invalid json }") with self.assertRaises(json.JSONDecodeError): get_package_list(malformed_path) def test_schema_validation_failure_raises_error(self): """TC06: JSON that fails schema validation raises ValidationError.""" with tempfile.TemporaryDirectory() as tmp_dir: # Missing required 'architecture' field for a package item invalid_json = { "SomeRole": { "packages": [ { "package": "firewalld", "type": "rpm", "repo_name": "x86_64_baseos", # Missing 'architecture' field } ] } } json_path = os.path.join(tmp_dir, "invalid_schema.json") with open(json_path, "w", encoding="utf-8") as f: json.dump(invalid_json, f) with self.assertRaises(ValidationError): get_package_list(json_path) def test_empty_feature_list_returns_empty_list(self): """TC07: Empty feature list returns empty list.""" with tempfile.TemporaryDirectory() as tmp_dir: empty_feature_list = FeatureList(features={}) json_path = 
os.path.join(tmp_dir, "empty_functional_layer.json") serialize_json(empty_feature_list, json_path) result = get_package_list(json_path) self.assertEqual(result, []) def test_package_attributes_are_complete(self): """TC08: All package fields are present in the response.""" result = get_package_list(self.fixture_path, role="Compiler") self.assertEqual(len(result), 1) packages = result[0]["packages"] self.assertGreater(len(packages), 0) # Check first package has all required fields first_pkg = packages[0] required_fields = ["name", "type", "repo_name", "architecture", "uri", "tag"] for field in required_fields: self.assertIn(field, first_pkg, f"Missing field: {field}") def test_package_with_uri_and_tag(self): """Verify packages with uri and tag fields are correctly returned.""" result = get_package_list(self.fixture_path, role="K8S Controller") packages = result[0]["packages"] # Find a package with tag (image type) image_pkgs = [p for p in packages if p["type"] == "image"] self.assertGreater(len(image_pkgs), 0) # Image packages should have tag self.assertIsNotNone(image_pkgs[0].get("tag")) # Find a package with uri (tarball type) tarball_pkgs = [p for p in packages if p["type"] == "tarball"] self.assertGreater(len(tarball_pkgs), 0) # Tarball packages should have uri self.assertIsNotNone(tarball_pkgs[0].get("uri")) def test_role_with_spaces_in_name(self): """Verify roles with spaces in name work correctly.""" result = get_package_list(self.fixture_path, role="K8S Controller") self.assertEqual(len(result), 1) self.assertEqual(result[0]["roleName"], "K8S Controller") def test_all_roles_returns_correct_package_counts(self): """Verify each role returns the correct number of packages.""" result = get_package_list(self.fixture_path, role=None) # Verify we have packages for each role for role_obj in result: self.assertIn("roleName", role_obj) self.assertIn("packages", role_obj) # Each role should have at least one package self.assertGreater( len(role_obj["packages"]), 0, f"Role {role_obj['roleName']} has no packages", ) def test_case_insensitive_role_matching_lowercase(self): """Verify role matching is case-insensitive with lowercase input.""" result = get_package_list(self.fixture_path, role="compiler") self.assertEqual(len(result), 1) # Should return the original role name from JSON self.assertEqual(result[0]["roleName"], "Compiler") def test_case_insensitive_role_matching_uppercase(self): """Verify role matching is case-insensitive with uppercase input.""" result = get_package_list(self.fixture_path, role="COMPILER") self.assertEqual(len(result), 1) self.assertEqual(result[0]["roleName"], "Compiler") def test_case_insensitive_role_matching_mixed_case(self): """Verify role matching is case-insensitive with mixed case input.""" result = get_package_list(self.fixture_path, role="k8s controller") self.assertEqual(len(result), 1) self.assertEqual(result[0]["roleName"], "K8S Controller") def test_case_insensitive_role_matching_preserves_original_name(self): """Verify the returned roleName preserves the original case from JSON.""" result = get_package_list(self.fixture_path, role="SLURM CONTROLLER") self.assertEqual(len(result), 1) # Should preserve original case from JSON self.assertEqual(result[0]["roleName"], "Slurm Controller") if __name__ == "__main__": unittest.main() ================================================ FILE: build_stream/core/catalog/tests/test_generator_roles.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. 
# # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. import os import sys import tempfile import unittest from jsonschema import ValidationError HERE = os.path.dirname(__file__) CATALOG_PARSER_DIR = os.path.dirname(HERE) PROJECT_ROOT = os.path.dirname(CATALOG_PARSER_DIR) if PROJECT_ROOT not in sys.path: sys.path.insert(0, PROJECT_ROOT) from catalog_parser.generator import ( FeatureList, serialize_json, get_functional_layer_roles_from_file, ) class TestGetFunctionalLayerRolesFromFile(unittest.TestCase): def test_returns_all_role_names_from_fixture(self): base_dir = os.path.dirname(__file__) fixture_path = os.path.abspath( os.path.join(base_dir, "..", "test_fixtures", "functional_layer.json") ) roles = get_functional_layer_roles_from_file(fixture_path) expected_roles = [ "Compiler", "K8S Controller", "K8S Worker", "Login Node", "Slurm Controller", "Slurm Worker", ] self.assertCountEqual(roles, expected_roles) def test_empty_feature_list_returns_empty_roles(self): with tempfile.TemporaryDirectory() as tmp_dir: empty_feature_list = FeatureList(features={}) json_path = os.path.join(tmp_dir, "functional_layer.json") serialize_json(empty_feature_list, json_path) roles = get_functional_layer_roles_from_file(json_path) self.assertEqual(roles, []) def test_invalid_functional_layer_json_fails_schema_validation(self): with tempfile.TemporaryDirectory() as tmp_dir: # Missing required 'architecture' field for a package item invalid_json = { "SomeRole": { "packages": [ { "package": "firewalld", "type": "rpm", "repo_name": "x86_64_baseos", } ] } } json_path = os.path.join(tmp_dir, "functional_layer_invalid.json") with open(json_path, "w") as f: import json json.dump(invalid_json, f) with self.assertRaises(ValidationError): get_functional_layer_roles_from_file(json_path) if __name__ == "__main__": unittest.main() ================================================ FILE: build_stream/core/catalog/tests/test_parser_defaults.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
import os import sys import unittest HERE = os.path.dirname(__file__) CATALOG_PARSER_DIR = os.path.dirname(HERE) PROJECT_ROOT = os.path.dirname(CATALOG_PARSER_DIR) if PROJECT_ROOT not in sys.path: sys.path.insert(0, PROJECT_ROOT) from catalog_parser.parser import ParseCatalog, _DEFAULT_SCHEMA_PATH class TestParseCatalogDefaults(unittest.TestCase): def test_default_schema_path_points_to_resources(self): catalog_parser_dir = os.path.dirname(os.path.dirname(__file__)) expected_schema = os.path.join(catalog_parser_dir, "resources", "CatalogSchema.json") self.assertEqual(os.path.abspath(_DEFAULT_SCHEMA_PATH), os.path.abspath(expected_schema)) def test_parse_catalog_with_explicit_paths_uses_fixture(self): catalog_parser_dir = os.path.dirname(os.path.dirname(__file__)) catalog_path = os.path.join(catalog_parser_dir, "test_fixtures", "catalog_rhel.json") schema_path = os.path.join(catalog_parser_dir, "resources", "CatalogSchema.json") catalog = ParseCatalog(catalog_path, schema_path) self.assertGreater(len(catalog.functional_packages), 0) if __name__ == "__main__": unittest.main() ================================================ FILE: build_stream/core/catalog/utils.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Utility functions for the catalog parser package.""" import json import logging import os from typing import Any, Optional def _configure_logging(log_file: Optional[str] = None, log_level: int = logging.INFO) -> None: """Configure root logging. If log_file is provided, logs are written to that file and the directory is created if needed; otherwise logs go to stderr. Note: This function clears existing handlers before configuring, allowing multiple calls with different log files to work correctly. """ root_logger = logging.getLogger() # Remove existing handlers to allow reconfiguration for handler in root_logger.handlers[:]: root_logger.removeHandler(handler) handler.close() if log_file: log_dir = os.path.dirname(log_file) if log_dir: os.makedirs(log_dir, exist_ok=True) logging.basicConfig( level=log_level, format="%(asctime)s - %(name)s - %(levelname)s - %(message)s", filename=log_file, encoding="utf-8", force=True, ) else: logging.basicConfig( level=log_level, format="%(asctime)s - %(name)s - %(levelname)s - %(message)s", force=True, ) def load_json_file(file_path: str) -> Any: """Load and parse a JSON file. Args: file_path: Path to the JSON file to load. Returns: The parsed JSON data (dict, list, or other JSON-compatible type). Raises: FileNotFoundError: If the file does not exist. json.JSONDecodeError: If the file contains invalid JSON. """ with open(file_path, "r", encoding="utf-8") as json_file: return json.load(json_file) ================================================ FILE: build_stream/core/common/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. 
# # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. ================================================ FILE: build_stream/core/exceptions.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Core exceptions for the Build Stream API.""" class ClientDisabledError(Exception): """Exception raised when client account is disabled.""" class InvalidClientError(Exception): """Exception raised when client credentials are invalid.""" class InvalidScopeError(Exception): """Exception raised when requested scope is not allowed.""" class TokenCreationError(Exception): """Exception raised when token creation fails.""" ================================================ FILE: build_stream/core/jobs/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
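# Example (hypothetical caller code, shown only to illustrate the public
# surface re-exported below; the literal IDs are placeholders, not values
# used anywhere in this package):
#
#     from core.jobs import Job, JobId, ClientId, JobState
#
#     job = Job(
#         job_id=JobId("5f8b4e2a-1c3d-4e5f-8a9b-0c1d2e3f4a5b"),
#         client_id=ClientId("build-stream-api"),
#         request_client_id="build-stream-api",
#     )
#     job.start()       # CREATED -> IN_PROGRESS
#     job.complete()    # IN_PROGRESS -> COMPLETED (terminal)
#     assert job.job_state is JobState.COMPLETED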
"""Job domain module for Build Stream.""" from .entities import Job, Stage, IdempotencyRecord, AuditEvent from .exceptions import ( JobDomainError, JobNotFoundError, JobAlreadyExistsError, InvalidStateTransitionError, TerminalStateViolationError, IdempotencyConflictError, ) from .repositories import ( JobRepository, StageRepository, IdempotencyRepository, AuditEventRepository, JobIdGenerator, UUIDGenerator, ) from .services import FingerprintService from .value_objects import ( JobId, CorrelationId, IdempotencyKey, StageName, StageType, RequestFingerprint, ClientId, JobState, ) __all__ = [ "Job", "Stage", "IdempotencyRecord", "AuditEvent", "JobDomainError", "JobNotFoundError", "JobAlreadyExistsError", "InvalidStateTransitionError", "TerminalStateViolationError", "IdempotencyConflictError", "JobRepository", "StageRepository", "IdempotencyRepository", "AuditEventRepository", "JobIdGenerator", "UUIDGenerator", "FingerprintService", "JobId", "CorrelationId", "IdempotencyKey", "StageName", "StageType", "RequestFingerprint", "ClientId", "JobState", ] ================================================ FILE: build_stream/core/jobs/entities/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Job domain entities.""" from .job import Job from .stage import Stage from .idempotency import IdempotencyRecord from .audit import AuditEvent __all__ = ["Job", "Stage", "IdempotencyRecord", "AuditEvent"] ================================================ FILE: build_stream/core/jobs/entities/audit.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Audit event entity.""" from dataclasses import dataclass, field from datetime import datetime from ..value_objects import ClientId, CorrelationId, JobId @dataclass(frozen=True) class AuditEvent: """Immutable audit event record. Captures significant domain events for audit trail and compliance. Attributes: event_id: Unique event identifier. job_id: Associated job identifier. event_type: Type of event (e.g., JOB_CREATED, STAGE_COMPLETED). correlation_id: Request correlation identifier. client_id: Client who triggered the event. timestamp: Event occurrence timestamp. details: Additional event-specific details. 
""" event_id: str job_id: JobId event_type: str correlation_id: CorrelationId client_id: ClientId timestamp: datetime details: dict = field(default_factory=dict) ================================================ FILE: build_stream/core/jobs/entities/idempotency.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Idempotency tracking record entity.""" from dataclasses import dataclass from datetime import datetime from ..value_objects import ClientId, IdempotencyKey, JobId, RequestFingerprint @dataclass(frozen=True) class IdempotencyRecord: """Idempotency tracking record. Immutable record linking idempotency key to job and request fingerprint. Used for request deduplication and retry safety. Attributes: idempotency_key: Client-provided deduplication token. job_id: Associated job identifier. request_fingerprint: SHA-256 hash of normalized request. client_id: Client who created the request. created_at: Record creation timestamp. expires_at: Record expiration timestamp. """ idempotency_key: IdempotencyKey job_id: JobId request_fingerprint: RequestFingerprint client_id: ClientId created_at: datetime expires_at: datetime def is_expired(self, current_time: datetime) -> bool: """Check if record has expired. Args: current_time: Current timestamp for comparison. Returns: True if record is expired. """ return current_time >= self.expires_at def matches_fingerprint(self, fingerprint: RequestFingerprint) -> bool: """Check if fingerprint matches this record. Args: fingerprint: Request fingerprint to compare. Returns: True if fingerprints match. """ return self.request_fingerprint == fingerprint ================================================ FILE: build_stream/core/jobs/entities/job.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Job aggregate root entity.""" from dataclasses import dataclass from datetime import datetime, timezone from typing import Optional from ..exceptions import InvalidStateTransitionError, TerminalStateViolationError from ..value_objects import ClientId, JobId, JobState @dataclass class Job: """Job aggregate root. Represents a build workflow execution with lifecycle management, state tracking, and optimistic locking. Attributes: job_id: Unique job identifier. client_id: Client who owns this job (from auth). request_client_id: Client ID from request payload. 
job_state: Current lifecycle state. client_name: Optional client name. created_at: Job creation timestamp. updated_at: Last modification timestamp. version: Optimistic locking version. tombstoned: Soft delete flag. """ job_id: JobId client_id: ClientId request_client_id: str client_name: Optional[str] = None job_state: JobState = JobState.CREATED created_at: Optional[datetime] = None updated_at: Optional[datetime] = None version: int = 1 tombstoned: bool = False def __post_init__(self) -> None: if self.created_at is None: self.created_at = datetime.now(timezone.utc) if self.updated_at is None: self.updated_at = self.created_at def _validate_transition( self, allowed_states: set[JobState], target_state: JobState ) -> None: """Validate state transition is allowed. Args: allowed_states: States from which transition is valid. target_state: Desired target state. Raises: TerminalStateViolationError: If in terminal state. InvalidStateTransitionError: If transition invalid. """ if self.job_state.is_terminal(): raise TerminalStateViolationError( entity_type="Job", entity_id=str(self.job_id), state=self.job_state.value ) if self.job_state not in allowed_states: raise InvalidStateTransitionError( entity_type="Job", entity_id=str(self.job_id), from_state=self.job_state.value, to_state=target_state.value ) def _update_metadata(self) -> None: """Update timestamp and version after state change.""" self.updated_at = datetime.now(timezone.utc) self.version += 1 def start(self) -> None: """Transition job from CREATED to IN_PROGRESS. Raises: InvalidStateTransitionError: If not in CREATED state. TerminalStateViolationError: If in terminal state. """ self._validate_transition({JobState.CREATED}, JobState.IN_PROGRESS) self.job_state = JobState.IN_PROGRESS self._update_metadata() def complete(self) -> None: """Transition job to COMPLETED state. Raises: InvalidStateTransitionError: If not in IN_PROGRESS state. TerminalStateViolationError: If already in terminal state. """ self._validate_transition({JobState.IN_PROGRESS}, JobState.COMPLETED) self.job_state = JobState.COMPLETED self._update_metadata() def fail(self) -> None: """Transition job to FAILED state. Raises: InvalidStateTransitionError: If not in IN_PROGRESS state. TerminalStateViolationError: If already in terminal state. """ self._validate_transition({JobState.IN_PROGRESS}, JobState.FAILED) self.job_state = JobState.FAILED self._update_metadata() def cancel(self) -> None: """Transition job to CANCELLED state. Can be called from CREATED or IN_PROGRESS states. Raises: InvalidStateTransitionError: If not in valid state for cancellation. TerminalStateViolationError: If already in terminal state. """ self._validate_transition( {JobState.CREATED, JobState.IN_PROGRESS}, JobState.CANCELLED ) self.job_state = JobState.CANCELLED self._update_metadata() def tombstone(self) -> None: """Mark job as tombstoned (soft delete). Tombstoned jobs cannot be modified but remain queryable. 
""" self.tombstoned = True self._update_metadata() def is_completed(self) -> bool: """Check if job is in COMPLETED state.""" return self.job_state == JobState.COMPLETED def is_failed(self) -> bool: """Check if job is in FAILED state.""" return self.job_state == JobState.FAILED def is_cancelled(self) -> bool: """Check if job is in CANCELLED state.""" return self.job_state == JobState.CANCELLED def is_in_progress(self) -> bool: """Check if job is in IN_PROGRESS state.""" return self.job_state == JobState.IN_PROGRESS ================================================ FILE: build_stream/core/jobs/entities/stage.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Stage entity within Job aggregate.""" from dataclasses import dataclass from datetime import datetime, timezone from typing import Optional from ..exceptions import InvalidStateTransitionError, TerminalStateViolationError from ..value_objects import JobId, StageName, StageState @dataclass class Stage: """Stage entity within Job aggregate. Represents a single stage execution with state tracking, error handling, and retry support. Attributes: job_id: Parent job identifier. stage_name: Stage identifier. stage_state: Current execution state. attempt: Execution attempt number (1-indexed). started_at: Stage start timestamp. ended_at: Stage end timestamp. error_code: Error code if failed. error_summary: Error description if failed. log_file_path: Ansible log file path on OIM host (NFS share). version: Optimistic locking version. """ job_id: JobId stage_name: StageName stage_state: StageState = StageState.PENDING attempt: int = 1 started_at: Optional[datetime] = None ended_at: Optional[datetime] = None error_code: Optional[str] = None error_summary: Optional[str] = None log_file_path: Optional[str] = None version: int = 1 def _initialize_timestamps(self) -> None: """Initialize timestamps when not provided (rehydration support).""" # Note: Stages don't auto-stamp on creation like Jobs # because they start as PENDING and get stamped when actually started/ended # No initialization needed for stages def _validate_transition( self, allowed_states: set[StageState], target_state: StageState ) -> None: """Validate state transition is allowed. Args: allowed_states: States from which transition is valid. target_state: Desired target state. Raises: TerminalStateViolationError: If in terminal state. InvalidStateTransitionError: If transition invalid. 
""" if self.stage_state.is_terminal(): raise TerminalStateViolationError( entity_type="Stage", entity_id=f"{self.job_id}/{self.stage_name}", state=self.stage_state.value ) if self.stage_state not in allowed_states: raise InvalidStateTransitionError( entity_type="Stage", entity_id=f"{self.job_id}/{self.stage_name}", from_state=self.stage_state.value, to_state=target_state.value ) def _mark_started(self) -> None: """Mark stage as started.""" self.started_at = datetime.now(timezone.utc) self.version += 1 def _mark_ended(self) -> None: """Mark stage as ended.""" self.ended_at = datetime.now(timezone.utc) self.version += 1 def start(self) -> None: """Transition stage from PENDING to IN_PROGRESS. Raises: InvalidStateTransitionError: If not in PENDING state. TerminalStateViolationError: If in terminal state. """ self._validate_transition({StageState.PENDING}, StageState.IN_PROGRESS) self.stage_state = StageState.IN_PROGRESS self._mark_started() def complete(self) -> None: """Transition stage to COMPLETED state. Raises: InvalidStateTransitionError: If not in IN_PROGRESS state. TerminalStateViolationError: If already in terminal state. """ self._validate_transition({StageState.IN_PROGRESS}, StageState.COMPLETED) self.stage_state = StageState.COMPLETED self._mark_ended() def fail(self, error_code: str, error_summary: str) -> None: """Transition stage to FAILED state with error details. Args: error_code: Error classification code. error_summary: Human-readable error description. Raises: InvalidStateTransitionError: If not in IN_PROGRESS state. TerminalStateViolationError: If already in terminal state. """ self._validate_transition({StageState.IN_PROGRESS}, StageState.FAILED) self.stage_state = StageState.FAILED self.error_code = error_code self.error_summary = error_summary self._mark_ended() def skip(self) -> None: """Transition stage to SKIPPED state. Raises: InvalidStateTransitionError: If not in PENDING state. TerminalStateViolationError: If already in terminal state. """ self._validate_transition({StageState.PENDING}, StageState.SKIPPED) self.stage_state = StageState.SKIPPED self._mark_ended() def cancel(self) -> None: """Transition stage to CANCELLED state. Can be called from PENDING or IN_PROGRESS states. Raises: InvalidStateTransitionError: If not in valid state for cancellation. TerminalStateViolationError: If already in terminal state. """ self._validate_transition( {StageState.PENDING, StageState.IN_PROGRESS}, StageState.CANCELLED ) self.stage_state = StageState.CANCELLED self._mark_ended() ================================================ FILE: build_stream/core/jobs/exceptions.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Domain exceptions for Job aggregate.""" from typing import Optional class JobDomainError(Exception): """Base exception for all job domain errors.""" def __init__(self, message: str, correlation_id: Optional[str] = None) -> None: """Initialize domain error. 
Args: message: Human-readable error description. correlation_id: Optional correlation ID for tracing. """ super().__init__(message) self.message = message self.correlation_id = correlation_id class JobNotFoundError(JobDomainError): """Job does not exist in the system.""" def __init__(self, job_id: str, correlation_id: Optional[str] = None) -> None: """Initialize job not found error. Args: job_id: The job ID that was not found. correlation_id: Optional correlation ID for tracing. """ super().__init__( f"Job not found: {job_id}", correlation_id=correlation_id ) self.job_id = job_id class JobAlreadyExistsError(JobDomainError): """Job with the given ID already exists.""" def __init__(self, job_id: str, correlation_id: Optional[str] = None) -> None: """Initialize job already exists error. Args: job_id: The job ID that already exists. correlation_id: Optional correlation ID for tracing. """ super().__init__( f"Job already exists: {job_id}", correlation_id=correlation_id ) self.job_id = job_id class InvalidStateTransitionError(JobDomainError): """Attempted state transition is not valid.""" def __init__( self, entity_type: str, entity_id: str, from_state: str, to_state: str, correlation_id: Optional[str] = None ) -> None: """Initialize invalid state transition error. Args: entity_type: Type of entity (Job or Stage). entity_id: Identifier of the entity. from_state: Current state. to_state: Attempted target state. correlation_id: Optional correlation ID for tracing. """ super().__init__( f"Invalid {entity_type} state transition for {entity_id}: " f"{from_state} -> {to_state}", correlation_id=correlation_id ) self.entity_type = entity_type self.entity_id = entity_id self.from_state = from_state self.to_state = to_state class TerminalStateViolationError(JobDomainError): """Attempted to modify an entity in a terminal state.""" def __init__( self, entity_type: str, entity_id: str, state: str, correlation_id: Optional[str] = None ) -> None: """Initialize terminal state violation error. Args: entity_type: Type of entity (Job or Stage). entity_id: Identifier of the entity. state: Current terminal state. correlation_id: Optional correlation ID for tracing. """ super().__init__( f"Cannot modify {entity_type} {entity_id} in terminal state: {state}", correlation_id=correlation_id ) self.entity_type = entity_type self.entity_id = entity_id self.state = state class OptimisticLockError(JobDomainError): """Version conflict detected during update.""" def __init__( self, entity_type: str, entity_id: str, expected_version: int, actual_version: int, correlation_id: Optional[str] = None ) -> None: """Initialize optimistic lock error. Args: entity_type: Type of entity (Job or Stage). entity_id: Identifier of the entity. expected_version: Version expected by the client. actual_version: Current version in the system. correlation_id: Optional correlation ID for tracing. """ super().__init__( f"Version conflict for {entity_type} {entity_id}: " f"expected {expected_version}, found {actual_version}", correlation_id=correlation_id ) self.entity_type = entity_type self.entity_id = entity_id self.expected_version = expected_version self.actual_version = actual_version class IdempotencyConflictError(JobDomainError): """Idempotency key conflict with different request fingerprint.""" def __init__( self, idempotency_key: str, existing_job_id: str, correlation_id: Optional[str] = None ) -> None: """Initialize idempotency conflict error. Args: idempotency_key: The conflicting idempotency key. 
existing_job_id: Job ID associated with the key. correlation_id: Optional correlation ID for tracing. """ super().__init__( f"Idempotency key {idempotency_key} already used for job {existing_job_id} " f"with different request fingerprint", correlation_id=correlation_id ) self.idempotency_key = idempotency_key self.existing_job_id = existing_job_id class StageAlreadyCompletedError(JobDomainError): """Stage has already been completed for this job.""" def __init__( self, job_id: str, stage_name: str, correlation_id: Optional[str] = None, ) -> None: """Initialize stage already completed error. Args: job_id: The job ID. stage_name: The stage that is already completed. correlation_id: Optional correlation ID for tracing. """ super().__init__( f"Stage {stage_name} already completed for job {job_id}", correlation_id=correlation_id, ) self.job_id = job_id self.stage_name = stage_name class UpstreamStageNotCompletedError(JobDomainError): """Required upstream stage has not completed.""" def __init__( self, job_id: str, required_stage: str, actual_state: str, correlation_id: Optional[str] = None, ) -> None: """Initialize upstream stage not completed error. Args: job_id: The job ID. required_stage: The upstream stage that must be completed. actual_state: The actual state of the upstream stage. correlation_id: Optional correlation ID for tracing. """ super().__init__( f"Upstream stage '{required_stage}' must be COMPLETED " f"(current state: {actual_state}) for job '{job_id}'", correlation_id=correlation_id, ) self.job_id = job_id self.required_stage = required_stage self.actual_state = actual_state class StageNotFoundError(JobDomainError): """Stage does not exist for the given job.""" def __init__( self, job_id: str, stage_name: str, correlation_id: Optional[str] = None ) -> None: """Initialize stage not found error. Args: job_id: The job ID. stage_name: The stage name that was not found. correlation_id: Optional correlation ID for tracing. """ super().__init__( f"Stage {stage_name} not found for job {job_id}", correlation_id=correlation_id ) self.job_id = job_id self.stage_name = stage_name ================================================ FILE: build_stream/core/jobs/repositories.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Repository port interfaces (Protocols) for Jobs domain. These define the contracts that infrastructure implementations must satisfy. Using Protocol instead of ABC allows for structural subtyping (duck typing). """ from typing import Protocol, Optional, List import uuid from .entities import Job, Stage, IdempotencyRecord, AuditEvent from .value_objects import JobId, IdempotencyKey, StageName class JobIdGenerator(Protocol): """Generator port for creating Job identifiers.""" def generate(self) -> JobId: """Generate a new Job identifier. Returns: A new, unique JobId. Raises: JobIdExhaustionError: If the generator cannot produce more IDs. """ ... 
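# ---------------------------------------------------------------------------
# Illustrative adapter (a minimal sketch, not one of the port definitions in
# this module): shows how infrastructure code can satisfy the JobIdGenerator
# protocol through structural subtyping. The class name is hypothetical.
# ---------------------------------------------------------------------------
class UuidJobIdGenerator:
    """Example generator that mints random UUIDv4-based JobIds."""

    def generate(self) -> JobId:
        # JobId.__post_init__ validates the format and normalises the string.
        return JobId(str(uuid.uuid4()))


# Usage (hypothetical): because JobIdGenerator is a typing.Protocol, no explicit
# inheritance is required; UuidJobIdGenerator type-checks wherever a
# JobIdGenerator is expected, e.g. job_id = UuidJobIdGenerator().generate().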
class JobRepository(Protocol): """Repository port for Job aggregate persistence.""" def save(self, job: Job) -> None: """Persist a job aggregate. Args: job: Job entity to persist. Raises: OptimisticLockError: If version conflict detected. """ ... def find_by_id(self, job_id: JobId) -> Optional[Job]: """Retrieve a job by its identifier. Args: job_id: Unique job identifier. Returns: Job entity if found, None otherwise. """ ... def exists(self, job_id: JobId) -> bool: """Check if a job exists. Args: job_id: Unique job identifier. Returns: True if job exists, False otherwise. """ ... class StageRepository(Protocol): """Repository port for Stage entity persistence.""" def save(self, stage: Stage) -> None: """Persist a single stage. Args: stage: Stage entity to persist. Raises: OptimisticLockError: If version conflict detected. """ ... def save_all(self, stages: List[Stage]) -> None: """Persist multiple stages atomically. Args: stages: List of stage entities to persist. Raises: OptimisticLockError: If version conflict detected. """ ... def find_by_job_and_name( self, job_id: JobId, stage_name: StageName ) -> Optional[Stage]: """Retrieve a stage by job and stage name. Args: job_id: Parent job identifier. stage_name: Stage identifier. Returns: Stage entity if found, None otherwise. """ ... def find_all_by_job(self, job_id: JobId) -> List[Stage]: """Retrieve all stages for a job. Args: job_id: Parent job identifier. Returns: List of stage entities (may be empty). """ ... class IdempotencyRepository(Protocol): """Repository port for IdempotencyRecord persistence.""" def save(self, record: IdempotencyRecord) -> None: """Persist an idempotency record. Args: record: Idempotency record to persist. """ ... def find_by_key(self, key: IdempotencyKey) -> Optional[IdempotencyRecord]: """Retrieve an idempotency record by key. Args: key: Idempotency key. Returns: IdempotencyRecord if found, None otherwise. """ ... class AuditEventRepository(Protocol): """Repository port for AuditEvent persistence.""" def save(self, event: AuditEvent) -> None: """Persist an audit event. Args: event: Audit event to persist. """ ... def find_by_job(self, job_id: JobId) -> List[AuditEvent]: """Retrieve all audit events for a job. Args: job_id: Job identifier. Returns: List of audit events (may be empty). """ ... class UUIDGenerator: """Interface for generating UUID objects.""" def generate(self) -> uuid.UUID: """Generate a UUID object. Returns: uuid.UUID: A UUID object (v4 or v7 format). """ ... ================================================ FILE: build_stream/core/jobs/services.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
"""Domain services for Jobs domain.""" import hashlib import json import logging from datetime import datetime, timezone from typing import Any, Dict from .entities import AuditEvent from .repositories import JobRepository, AuditEventRepository, UUIDGenerator from .value_objects import JobId, RequestFingerprint logger = logging.getLogger(__name__) class FingerprintService: """Domain service for computing request fingerprints. Computes deterministic SHA-256 hash of request payload for idempotency. """ @staticmethod def compute(request_body: Dict[str, Any]) -> RequestFingerprint: """Compute SHA-256 fingerprint of request payload. Creates a deterministic hash by: 1. Sorting keys alphabetically 2. JSON serializing with no whitespace 3. UTF-8 encoding 4. SHA-256 hashing Args: request_body: Dictionary of request fields. Returns: RequestFingerprint value object. Example: >>> body = {"job_id": "123", "client_id": "abc"} >>> fp = FingerprintService.compute(body) >>> len(fp.value) 64 """ normalized = json.dumps(request_body, sort_keys=True, separators=(',', ':')) digest = hashlib.sha256(normalized.encode('utf-8')).hexdigest() return RequestFingerprint(digest) class JobStateHelper: """Static utility for centralized job state management. Provides methods to update job state when stages fail or complete, leveraging existing repository dependencies without requiring new services. """ @staticmethod def handle_stage_failure( job_repo: JobRepository, audit_repo: AuditEventRepository, uuid_generator: UUIDGenerator, job_id: JobId, stage_name: str, error_code: str, error_summary: str, correlation_id: str, client_id: str, ) -> None: """Update job state to FAILED when a stage fails. This method: 1. Retrieves the job 2. Transitions job to FAILED state (if not already terminal) 3. Saves the updated job 4. Emits JOB_FAILED audit event 5. Commits sessions if repositories have active sessions Args: job_repo: Job repository for loading/saving jobs. audit_repo: Audit repository for emitting events. uuid_generator: UUID generator for event IDs. job_id: Job identifier. stage_name: Name of the failed stage. error_code: Error code from stage failure. error_summary: Error summary from stage failure. correlation_id: Request correlation ID. client_id: Client identifier. 
""" try: job = job_repo.find_by_id(job_id) if job is None: logger.warning( "Job not found when handling stage failure: job_id=%s, stage=%s", job_id, stage_name ) return if job.job_state.is_terminal(): logger.info( "Job already in terminal state: job_id=%s, state=%s, stage=%s", job_id, job.job_state.value, stage_name ) return job.fail() job_repo.save(job) event = AuditEvent( event_id=str(uuid_generator.generate()), job_id=job_id, event_type="JOB_FAILED", correlation_id=correlation_id, client_id=client_id, timestamp=datetime.now(timezone.utc), details={ "failed_stage": stage_name, "error_code": error_code, "error_summary": error_summary, }, ) audit_repo.save(event) # Commit sessions if repositories have active sessions if hasattr(job_repo, 'session') and job_repo.session: job_repo.session.commit() if hasattr(audit_repo, 'session') and audit_repo.session: audit_repo.session.commit() logger.info( "Job marked as FAILED: job_id=%s, failed_stage=%s, error_code=%s", job_id, stage_name, error_code ) except Exception as exc: logger.exception( "Failed to update job state on stage failure: job_id=%s, stage=%s", job_id, stage_name ) @staticmethod def handle_job_completion( job_repo: JobRepository, audit_repo: AuditEventRepository, uuid_generator: UUIDGenerator, job_id: JobId, correlation_id: str, client_id: str, ) -> None: """Update job state to COMPLETED when final stage completes. This method: 1. Retrieves the job 2. Transitions job to COMPLETED state (if not already terminal) 3. Saves the updated job 4. Emits JOB_COMPLETED audit event 5. Commits sessions if repositories have active sessions Args: job_repo: Job repository for loading/saving jobs. audit_repo: Audit repository for emitting events. uuid_generator: UUID generator for event IDs. job_id: Job identifier. correlation_id: Request correlation ID. client_id: Client identifier. """ try: job = job_repo.find_by_id(job_id) if job is None: logger.warning( "Job not found when handling completion: job_id=%s", job_id ) return if job.job_state.is_terminal(): logger.info( "Job already in terminal state: job_id=%s, state=%s", job_id, job.job_state.value ) return job.complete() job_repo.save(job) event = AuditEvent( event_id=str(uuid_generator.generate()), job_id=job_id, event_type="JOB_COMPLETED", correlation_id=correlation_id, client_id=client_id, timestamp=datetime.now(timezone.utc), details={ "completion_reason": "All stages completed successfully", }, ) audit_repo.save(event) # Commit sessions if repositories have active sessions if hasattr(job_repo, 'session') and job_repo.session: job_repo.session.commit() if hasattr(audit_repo, 'session') and audit_repo.session: audit_repo.session.commit() logger.info( "Job marked as COMPLETED: job_id=%s", job_id ) except Exception as exc: logger.exception( "Failed to update job state on completion: job_id=%s", job_id ) ================================================ FILE: build_stream/core/jobs/value_objects.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 
# See the License for the specific language governing permissions and # limitations under the License. """Value objects for Job domain. All value objects are immutable and defined by their values, not identity. """ import uuid import re from dataclasses import dataclass from enum import Enum from typing import ClassVar @dataclass(frozen=True) class JobId: """UUID identifier for a job. Attributes: value: String representation of UUID. Raises: ValueError: If value does not match UUID format or exceeds length. """ value: str MAX_LENGTH: ClassVar[int] = 36 # UUID standard length def __post_init__(self) -> None: """Validate UUID format and length.""" if len(self.value) > self.MAX_LENGTH: raise ValueError( f"JobId length cannot exceed {self.MAX_LENGTH} characters, " f"got {len(self.value)}" ) try: uuid_obj = uuid.UUID(self.value) except Exception as exc: raise ValueError(f"Invalid UUID format: {self.value}") from exc # normalize representation object.__setattr__(self, "value", str(uuid_obj)) def __str__(self) -> str: """Return string representation.""" return self.value @dataclass(frozen=True) class CorrelationId: """UUID identifier for request tracing. Attributes: value: String representation of UUID. Raises: ValueError: If value does not match UUID format or exceeds length. """ value: str MAX_LENGTH: ClassVar[int] = 36 # UUID standard length def __post_init__(self) -> None: """Validate UUID format and length.""" if len(self.value) > self.MAX_LENGTH: raise ValueError( f"CorrelationId length cannot exceed {self.MAX_LENGTH} characters, " f"got {len(self.value)}" ) try: uuid_obj = uuid.UUID(self.value) except Exception as exc: raise ValueError(f"Invalid UUID format: {self.value}") from exc object.__setattr__(self, "value", str(uuid_obj)) def __str__(self) -> str: """Return string representation.""" return self.value class StageType(str, Enum): """Canonical stage types for BuildStreaM workflow. All valid stage identifiers in the closed set. Used by StageName VO for validation and by domain logic to avoid raw string comparisons. """ PARSE_CATALOG = "parse-catalog" GENERATE_INPUT_FILES = "generate-input-files" CREATE_LOCAL_REPOSITORY = "create-local-repository" #CREATE_IMAGE_REPOSITORY = "create-image-repository" BUILD_IMAGE_X86_64 = "build-image-x86_64" BUILD_IMAGE_AARCH64 = "build-image-aarch64" VALIDATE_IMAGE_ON_TEST = "validate-image-on-test" #PROMOTE = "promote" @dataclass(frozen=True) class StageName: """Canonical stage identifier. Attributes: value: Stage name from canonical set. Raises: ValueError: If value is not in canonical stages set or exceeds length. """ value: str MAX_LENGTH: ClassVar[int] = 30 def __post_init__(self) -> None: """Validate stage name is in canonical set and length.""" if len(self.value) > self.MAX_LENGTH: raise ValueError( f"StageName length cannot exceed {self.MAX_LENGTH} characters, " f"got {len(self.value)}" ) try: StageType(self.value) except ValueError as exc: raise ValueError( f"Invalid stage name: {self.value}. " f"Must be one of: {sorted([stage.value for stage in StageType])}" ) from exc def as_enum(self) -> StageType: """Convert stage name to StageType enum. Returns: StageType: The corresponding enum value. """ return StageType(self.value) def __str__(self) -> str: """Return string representation.""" return self.value @dataclass(frozen=True) class IdempotencyKey: """Client-provided deduplication token. Attributes: value: Idempotency key string (1-255 characters). Raises: ValueError: If value length is invalid. 
""" value: str MIN_LENGTH: ClassVar[int] = 1 MAX_LENGTH: ClassVar[int] = 255 def __post_init__(self) -> None: """Validate key length.""" length = len(self.value) if length < self.MIN_LENGTH or length > self.MAX_LENGTH: raise ValueError( f"Idempotency key length must be between {self.MIN_LENGTH} " f"and {self.MAX_LENGTH} characters, got {length}" ) def __str__(self) -> str: """Return string representation.""" return self.value @dataclass(frozen=True) class RequestFingerprint: """SHA-256 hash of normalized request payload. Attributes: value: 64-character hex string (SHA-256 digest). Raises: ValueError: If value does not match SHA-256 pattern or exceeds length. """ value: str SHA256_PATTERN: ClassVar[str] = r'^[0-9a-f]{64}$' MAX_LENGTH: ClassVar[int] = 64 # SHA-256 hex digest length def __post_init__(self) -> None: """Validate SHA-256 format and length.""" if len(self.value) > self.MAX_LENGTH: raise ValueError( f"RequestFingerprint length cannot exceed {self.MAX_LENGTH} characters, " f"got {len(self.value)}" ) if not re.match(self.SHA256_PATTERN, self.value.lower()): raise ValueError( f"Invalid SHA-256 format: {self.value}. " f"Expected 64 hexadecimal characters." ) def __str__(self) -> str: """Return string representation.""" return self.value @dataclass(frozen=True) class ClientId: """Client identity from authentication. Attributes: value: Client identifier string. Raises: ValueError: If value is empty or exceeds length. """ value: str MAX_LENGTH: ClassVar[int] = 128 # Reasonable client ID length limit def __post_init__(self) -> None: """Validate client ID is not empty and within length limit.""" if len(self.value) > self.MAX_LENGTH: raise ValueError( f"ClientId length cannot exceed {self.MAX_LENGTH} characters, " f"got {len(self.value)}" ) if not self.value or not self.value.strip(): raise ValueError("Client ID cannot be empty") def __str__(self) -> str: """Return string representation.""" return self.value class JobState(str, Enum): """Job lifecycle states. Terminal states (COMPLETED, FAILED, CANCELLED) cannot transition. """ CREATED = "CREATED" IN_PROGRESS = "IN_PROGRESS" COMPLETED = "COMPLETED" FAILED = "FAILED" CANCELLED = "CANCELLED" def is_terminal(self) -> bool: """Check if state is terminal (immutable). Returns: True if state is COMPLETED, FAILED, or CANCELLED. """ return self in {JobState.COMPLETED, JobState.FAILED, JobState.CANCELLED} class StageState(str, Enum): """Stage execution states. Terminal states (COMPLETED, FAILED, SKIPPED, CANCELLED) cannot transition. """ PENDING = "PENDING" IN_PROGRESS = "IN_PROGRESS" COMPLETED = "COMPLETED" FAILED = "FAILED" SKIPPED = "SKIPPED" CANCELLED = "CANCELLED" def is_terminal(self) -> bool: """Check if state is terminal (immutable). Returns: True if state is COMPLETED, FAILED, SKIPPED, or CANCELLED. """ return self in { StageState.COMPLETED, StageState.FAILED, StageState.SKIPPED, StageState.CANCELLED, } ================================================ FILE: build_stream/core/localrepo/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. 
# You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Local repository domain module for Build Stream.""" from core.localrepo.entities import PlaybookRequest, PlaybookResult from core.localrepo.exceptions import ( InputDirectoryInvalidError, InputFilesMissingError, LocalRepoDomainError, QueueUnavailableError, ) from core.localrepo.repositories import ( InputDirectoryRepository, PlaybookQueueRequestRepository, PlaybookQueueResultRepository, ) from core.localrepo.services import ( InputFileService, PlaybookQueueRequestService, PlaybookQueueResultService, ) __all__ = [ "PlaybookRequest", "PlaybookResult", "InputDirectoryInvalidError", "InputFilesMissingError", "LocalRepoDomainError", "QueueUnavailableError", "InputDirectoryRepository", "PlaybookQueueRequestRepository", "PlaybookQueueResultRepository", "InputFileService", "PlaybookQueueRequestService", "PlaybookQueueResultService", ] ================================================ FILE: build_stream/core/localrepo/entities.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Domain entities for Local Repository module.""" from dataclasses import dataclass from datetime import datetime, timezone from typing import Any, Dict, Optional from core.jobs.value_objects import CorrelationId, JobId from core.localrepo.value_objects import ExecutionTimeout, ExtraVars, PlaybookPath @dataclass(frozen=True) class PlaybookRequest: """Immutable value object representing a playbook execution request. Written to the NFS playbook queue for OIM Core consumption. Attributes: job_id: Parent job identifier. stage_name: Stage identifier (create-local-repository). playbook_path: Validated path to the playbook. extra_vars: Ansible extra variables. correlation_id: Request tracing identifier. timeout: Execution timeout configuration. submitted_at: Request submission timestamp. request_id: Unique request identifier. """ job_id: str stage_name: str playbook_path: PlaybookPath extra_vars: ExtraVars correlation_id: str timeout: ExecutionTimeout submitted_at: str request_id: str def to_dict(self) -> Dict[str, Any]: """Serialize request to dictionary for JSON file writing.""" return { "job_id": self.job_id, "stage_name": self.stage_name, "playbook_path": str(self.playbook_path), "extra_vars": self.extra_vars.to_dict(), "correlation_id": self.correlation_id, "timeout_minutes": self.timeout.minutes, "submitted_at": self.submitted_at, "request_id": self.request_id, } def generate_filename(self) -> str: """Generate request file name following naming convention. 
Returns: Filename: {job_id}_{stage_name}_{timestamp}.json """ timestamp = datetime.now(timezone.utc).strftime("%Y%m%d_%H%M%S") return f"{self.job_id}_{self.stage_name}_{timestamp}.json" @dataclass(frozen=True) class PlaybookResult: """Immutable value object representing a playbook execution result. Read from the NFS playbook queue results directory. Attributes: job_id: Parent job identifier. stage_name: Stage identifier. request_id: Original request identifier. status: Execution status (success or failed). exit_code: Process exit code. stdout: Captured standard output. stderr: Captured standard error. started_at: Execution start timestamp. completed_at: Execution completion timestamp. duration_seconds: Total execution duration. error_code: Error classification code (if failed). error_summary: Human-readable error description (if failed). timestamp: Result creation timestamp. log_file_path: Ansible log file path on OIM host (NFS share). """ job_id: str stage_name: str request_id: str status: str exit_code: int stdout: str = "" stderr: str = "" started_at: str = "" completed_at: str = "" duration_seconds: int = 0 error_code: Optional[str] = None error_summary: Optional[str] = None timestamp: str = "" log_file_path: Optional[str] = None @property def is_success(self) -> bool: """Check if execution was successful.""" return self.status == "success" @property def is_failed(self) -> bool: """Check if execution failed.""" return self.status == "failed" @staticmethod def from_dict(data: Dict[str, Any]) -> "PlaybookResult": """Deserialize result from dictionary (parsed from JSON file). Args: data: Dictionary parsed from result JSON file. Returns: PlaybookResult instance. Raises: KeyError: If required fields are missing. ValueError: If field values are invalid. """ return PlaybookResult( job_id=data["job_id"], stage_name=data["stage_name"], request_id=data.get("request_id", ""), status=data["status"], exit_code=data.get("exit_code", -1), stdout=data.get("stdout", ""), stderr=data.get("stderr", ""), started_at=data.get("started_at", ""), completed_at=data.get("completed_at", ""), duration_seconds=data.get("duration_seconds", 0), error_code=data.get("error_code"), error_summary=data.get("error_summary"), timestamp=data.get("timestamp", ""), log_file_path=data.get("log_file_path"), ) ================================================ FILE: build_stream/core/localrepo/exceptions.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Domain exceptions for Local Repository module.""" from typing import Optional class LocalRepoDomainError(Exception): """Base exception for all local repo domain errors.""" def __init__(self, message: str, correlation_id: Optional[str] = None) -> None: """Initialize domain error. Args: message: Human-readable error description. correlation_id: Optional correlation ID for tracing. 
""" super().__init__(message) self.message = message self.correlation_id = correlation_id class QueueUnavailableError(LocalRepoDomainError): """NFS playbook queue is not accessible.""" def __init__( self, queue_path: str, reason: str = "", correlation_id: Optional[str] = None, ) -> None: """Initialize queue unavailable error. Args: queue_path: Path to the unavailable queue directory. reason: Reason the queue is unavailable. correlation_id: Optional correlation ID for tracing. """ super().__init__( f"Playbook queue unavailable at {queue_path}: {reason}", correlation_id=correlation_id, ) self.queue_path = queue_path self.reason = reason class InputFilesMissingError(LocalRepoDomainError): """Required input files not found for job.""" def __init__( self, job_id: str, input_path: str, correlation_id: Optional[str] = None, ) -> None: """Initialize input files missing error. Args: job_id: The job ID with missing input files. input_path: Expected input directory path. correlation_id: Optional correlation ID for tracing. """ super().__init__( f"Input files not found for job {job_id} at {input_path}. " f"Run GenerateInputFiles API first.", correlation_id=correlation_id, ) self.job_id = job_id self.input_path = input_path class InputDirectoryInvalidError(LocalRepoDomainError): """Input directory structure is invalid.""" def __init__( self, job_id: str, input_path: str, reason: str = "", correlation_id: Optional[str] = None, ) -> None: """Initialize input directory invalid error. Args: job_id: The job ID with invalid input directory. input_path: Path to the invalid input directory. reason: Reason the directory is invalid. correlation_id: Optional correlation ID for tracing. """ super().__init__( f"Input directory invalid for job {job_id} at {input_path}: {reason}", correlation_id=correlation_id, ) self.job_id = job_id self.input_path = input_path self.reason = reason ================================================ FILE: build_stream/core/localrepo/repositories.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Repository port interfaces (Protocols) for Local Repository domain. These define the contracts that infrastructure implementations must satisfy. Using Protocol instead of ABC allows for structural subtyping (duck typing). """ from pathlib import Path from typing import List, Protocol from core.localrepo.entities import PlaybookRequest, PlaybookResult class PlaybookQueueRequestRepository(Protocol): """Repository port for writing playbook requests to the NFS queue.""" def write_request(self, request: PlaybookRequest) -> Path: """Write a playbook request file to the requests directory. Args: request: Playbook request to write. Returns: Path to the written request file. Raises: QueueUnavailableError: If the queue directory is not accessible. """ ... def is_available(self) -> bool: """Check if the request queue directory is accessible. Returns: True if the queue directory exists and is writable. 
""" ... class PlaybookQueueResultRepository(Protocol): """Repository port for reading playbook results from the NFS queue.""" def get_unprocessed_results(self) -> List[Path]: """Return list of result files not yet processed. Returns: List of paths to unprocessed result JSON files. """ ... def read_result(self, result_path: Path) -> PlaybookResult: """Read and parse a result file. Args: result_path: Path to the result JSON file. Returns: Parsed PlaybookResult entity. Raises: ValueError: If the result file is malformed. """ ... def archive_result(self, result_path: Path) -> None: """Move a processed result file to the archive directory. Args: result_path: Path to the result file to archive. """ ... def is_available(self) -> bool: """Check if the result queue directory is accessible. Returns: True if the queue directory exists and is readable. """ ... class InputDirectoryRepository(Protocol): """Repository port for managing input directory paths.""" def get_source_input_repository_path(self, job_id: str) -> Path: """Get source input directory path for a job. Args: job_id: Job identifier. Returns: Path like /artifacts/{job_id}/input/ """ ... def get_destination_input_repository_path(self) -> Path: """Get destination input directory path expected by playbook. Returns: Path like /opt/omnia/input/project_build_stream/ """ ... def validate_input_directory(self, path: Path) -> bool: """Validate that input directory exists and contains required files. Args: path: Path to the input directory to validate. Returns: True if directory is valid and contains required files. """ ... ================================================ FILE: build_stream/core/localrepo/services.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Domain services for Local Repository module.""" import logging import shutil from pathlib import Path from typing import Callable from api.logging_utils import log_secure_info from core.localrepo.entities import PlaybookRequest, PlaybookResult from core.localrepo.exceptions import ( InputDirectoryInvalidError, InputFilesMissingError, QueueUnavailableError, ) from core.localrepo.repositories import ( InputDirectoryRepository, PlaybookQueueRequestRepository, PlaybookQueueResultRepository, ) logger = logging.getLogger(__name__) class InputFileService: """Service for validating and preparing input files before playbook execution. Ensures that required input files exist and are properly staged in the destination directory expected by the playbook. """ def __init__(self, input_repo: InputDirectoryRepository) -> None: """Initialize input file service. Args: input_repo: Input directory repository implementation. """ self._input_repo = input_repo def prepare_playbook_input( self, job_id: str, correlation_id: str = "", ) -> bool: """Prepare input files for playbook execution. Validates source input files exist, then copies them to the destination directory expected by the playbook. 
Args: job_id: Job identifier to prepare input for. correlation_id: Request correlation ID for tracing. Returns: True if input preparation was successful. Raises: InputFilesMissingError: If source input files not found. InputDirectoryInvalidError: If source directory is invalid. """ source_path = self._input_repo.get_source_input_repository_path(job_id) destination_path = self._input_repo.get_destination_input_repository_path() if not self._input_repo.validate_input_directory(source_path): logger.error( "Input files not found for job %s at %s, correlation_id=%s", job_id, source_path, correlation_id, ) raise InputFilesMissingError( job_id=job_id, input_path=str(source_path), correlation_id=correlation_id, ) try: destination_path.mkdir(parents=True, exist_ok=True) # Copy software_config.json file if it exists software_config_file = source_path / "software_config.json" if software_config_file.is_file(): dest_file = destination_path / "software_config.json" shutil.copy2(str(software_config_file), str(dest_file)) logger.info("Copied software_config.json for job %s", job_id) # Copy config directory completely if it exists config_dir = source_path / "config" if config_dir.is_dir(): dest_config_dir = destination_path / "config" shutil.copytree(str(config_dir), str(dest_config_dir), dirs_exist_ok=True) logger.info("Copied config directory for job %s", job_id) # Reset software.csv files for both architectures # (temporary fix to ensure new packages are downloaded when catalog changes) self._reset_software_csv_files() log_secure_info( "info", f"Input files prepared for job {job_id}", str(correlation_id), ) return True except OSError as exc: log_secure_info( "error", f"Failed to prepare input files for job {job_id}", str(correlation_id), ) raise InputDirectoryInvalidError( job_id=job_id, input_path=str(source_path), reason=str(exc), correlation_id=correlation_id, ) from exc def _reset_software_csv_files(self) -> None: """Reset software.csv files for both architectures. This is a temporary fix to ensure new packages are downloaded when the catalog changes. Eventually, the playbook should be modified to handle package-level status instead of relying on software.csv. Removes software.csv files at: - /opt/omnia/log/local_repo/x86_64/software.csv - /opt/omnia/log/local_repo/aarch64/software.csv Only attempts removal if parent directories exist. """ architectures = ["x86_64", "aarch64"] base_path = Path("/opt/omnia/log/local_repo") for arch in architectures: software_csv_path = base_path / arch / "software.csv" # Check if parent directory exists before attempting removal if not software_csv_path.parent.exists(): logger.debug( "Parent directory does not exist for %s, skipping removal", software_csv_path, ) continue # Remove file if it exists if software_csv_path.exists(): try: software_csv_path.unlink() logger.info( "Reset software.csv for architecture %s at %s", arch, software_csv_path, ) except (PermissionError, FileNotFoundError, IsADirectoryError): logger.warning( "Failed to remove software.csv for architecture %s", arch, ) else: logger.debug( "software.csv does not exist for architecture %s at %s", arch, software_csv_path, ) class PlaybookQueueRequestService: """Service for managing playbook request queue operations. Handles writing playbook requests to the NFS shared volume for consumption by the OIM Core watcher service. """ def __init__(self, request_repo: PlaybookQueueRequestRepository) -> None: """Initialize request queue service. Args: request_repo: Playbook queue request repository implementation. 
""" self._request_repo = request_repo def submit_request( self, request: PlaybookRequest, correlation_id: str = "", ) -> Path: """Submit a playbook request to the NFS queue. Args: request: Playbook request to submit. correlation_id: Request correlation ID for tracing. Returns: Path to the written request file. Raises: QueueUnavailableError: If the queue is not accessible. """ if not self._request_repo.is_available(): raise QueueUnavailableError( queue_path="requests", reason="Request queue directory is not accessible", correlation_id=correlation_id, ) request_path = self._request_repo.write_request(request) log_secure_info( "info", f"Request submitted for job {request.job_id}", str(request.correlation_id), ) return request_path class PlaybookQueueResultService: """Service for polling and processing playbook execution results. Monitors the NFS result queue and invokes callbacks when results are available. """ def __init__(self, result_repo: PlaybookQueueResultRepository) -> None: """Initialize result queue service. Args: result_repo: Playbook queue result repository implementation. """ self._result_repo = result_repo def poll_results( self, callback: Callable[[PlaybookResult], None], ) -> int: """Poll for new results and invoke callback for each. Args: callback: Function to call with each new result. Returns: Number of results processed. """ if not self._result_repo.is_available(): #logger.warning("Result queue directory is not accessible") return 0 result_files = self._result_repo.get_unprocessed_results() processed_count = 0 for result_path in result_files: try: result = self._result_repo.read_result(result_path) callback(result) self._result_repo.archive_result(result_path) processed_count += 1 log_secure_info( "info", f"Processed result for job {result.job_id}", str(result.request_id), ) except (ValueError, KeyError) as exc: log_secure_info( "error", "Failed to parse result file", ) except Exception as exc: # pylint: disable=broad-except log_secure_info( "error", "Failed to process result file", ) return processed_count ================================================ FILE: build_stream/core/localrepo/value_objects.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Value objects for Local Repository domain. All value objects are immutable and defined by their values, not identity. """ import re from dataclasses import dataclass from typing import ClassVar, Dict, Any @dataclass(frozen=True) class PlaybookPath: """Validated playbook name for Ansible execution. Attributes: value: Playbook name (e.g., 'include_input_dir.yml') without path. The watcher service will map this to the full path internally. Raises: ValueError: If name is empty, invalid format, or contains traversal. 
""" value: str MAX_LENGTH: ClassVar[int] = 128 # Reasonable limit for a filename ALLOWED_NAME_PATTERN: ClassVar[str] = r'^[a-zA-Z0-9_\-\.]+\.ya?ml$' def __post_init__(self) -> None: """Validate playbook name format and security.""" if not self.value or not self.value.strip(): raise ValueError("Playbook name cannot be empty") if len(self.value) > self.MAX_LENGTH: raise ValueError( f"Playbook name length cannot exceed {self.MAX_LENGTH} " f"characters, got {len(self.value)}" ) if ".." in self.value: raise ValueError( f"Path traversal not allowed in playbook name: {self.value}" ) if '/' in self.value: raise ValueError( f"Playbook name cannot contain path separators: {self.value}" ) # Validate playbook name format if not re.match(self.ALLOWED_NAME_PATTERN, self.value): raise ValueError( f"Invalid playbook name format: {self.value}. " f"Must be a valid filename with .yml or .yaml extension." ) def __str__(self) -> str: """Return string representation.""" return self.value @dataclass(frozen=True) class ExtraVars: """Ansible extra variables container. Immutable container for ansible-playbook --extra-vars parameters. Attributes: values: Dictionary of extra variable key-value pairs. Raises: ValueError: If values is None or contains invalid keys. """ values: Dict[str, Any] MAX_KEYS: ClassVar[int] = 50 KEY_PATTERN: ClassVar[str] = r'^[a-zA-Z_][a-zA-Z0-9_]*$' def __post_init__(self) -> None: """Validate extra vars structure.""" if self.values is None: raise ValueError("Extra vars cannot be None") if len(self.values) > self.MAX_KEYS: raise ValueError( f"Extra vars cannot exceed {self.MAX_KEYS} keys, " f"got {len(self.values)}" ) for key in self.values: if not re.match(self.KEY_PATTERN, key): raise ValueError( f"Invalid extra var key: {key}. " f"Must match pattern: {self.KEY_PATTERN}" ) def to_dict(self) -> Dict[str, Any]: """Return a copy of the extra vars dictionary.""" return dict(self.values) def __str__(self) -> str: """Return string representation.""" return str(self.values) @dataclass(frozen=True) class ExecutionTimeout: """Timeout configuration for playbook execution. Attributes: minutes: Timeout duration in minutes. Raises: ValueError: If minutes is not within valid range. """ minutes: int MIN_MINUTES: ClassVar[int] = 1 MAX_MINUTES: ClassVar[int] = 120 DEFAULT_MINUTES: ClassVar[int] = 30 def __post_init__(self) -> None: """Validate timeout range.""" if not isinstance(self.minutes, int): raise ValueError( f"Timeout minutes must be an integer, got {type(self.minutes)}" ) if self.minutes < self.MIN_MINUTES or self.minutes > self.MAX_MINUTES: raise ValueError( f"Timeout must be between {self.MIN_MINUTES} and " f"{self.MAX_MINUTES} minutes, got {self.minutes}" ) @classmethod def default(cls) -> "ExecutionTimeout": """Create default timeout configuration.""" return cls(minutes=cls.DEFAULT_MINUTES) def to_seconds(self) -> int: """Convert timeout to seconds.""" return self.minutes * 60 def __str__(self) -> str: """Return string representation.""" return f"{self.minutes}m" ================================================ FILE: build_stream/core/utils/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. 
# You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. ================================================ FILE: build_stream/core/validate/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """ValidateImageOnTest domain module. This module contains domain logic for validate-image-on-test operations. """ from core.validate.entities import ValidateImageOnTestRequest from core.validate.exceptions import ( ValidateDomainError, EnvironmentUnavailableError, ValidationExecutionError, ) __all__ = [ "ValidateImageOnTestRequest", "ValidateDomainError", "EnvironmentUnavailableError", "ValidationExecutionError", ] ================================================ FILE: build_stream/core/validate/entities.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Domain entities for ValidateImageOnTest module.""" from dataclasses import dataclass from datetime import datetime, timezone from typing import Any, Dict from core.localrepo.value_objects import ExecutionTimeout, ExtraVars, PlaybookPath @dataclass(frozen=True) class ValidateImageOnTestRequest: """Immutable entity representing a validate-image-on-test request. Written to the NFS queue for OIM Core consumption. Compatible with PlaybookRequest interface for reuse of existing repository. Attributes: job_id: Parent job identifier. stage_name: Stage identifier (validate-image-on-test). playbook_path: Validated path to the discovery playbook. extra_vars: Ansible extra variables (includes job_id). correlation_id: Request tracing identifier. timeout: Execution timeout configuration. submitted_at: Request submission timestamp. request_id: Unique request identifier. 
""" job_id: str stage_name: str playbook_path: PlaybookPath extra_vars: ExtraVars correlation_id: str timeout: ExecutionTimeout submitted_at: str request_id: str def to_dict(self) -> Dict[str, Any]: """Serialize request to dictionary for JSON file writing.""" return { "job_id": self.job_id, "stage_name": self.stage_name, "playbook_path": str(self.playbook_path), "extra_vars": self.extra_vars.to_dict(), "correlation_id": self.correlation_id, "timeout_minutes": self.timeout.minutes, "submitted_at": self.submitted_at, "request_id": self.request_id, } def generate_filename(self) -> str: """Generate request file name following naming convention. Returns: Filename: {job_id}_{stage_name}_{timestamp}.json """ timestamp = datetime.now(timezone.utc).strftime("%Y%m%d_%H%M%S") return f"{self.job_id}_{self.stage_name}_{timestamp}.json" ================================================ FILE: build_stream/core/validate/exceptions.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """ValidateImageOnTest domain exceptions.""" class ValidateDomainError(Exception): """Base exception for validate-image-on-test domain errors.""" def __init__(self, message: str, correlation_id: str = ""): """Initialize domain error. Args: message: Error message. correlation_id: Request correlation ID for tracing. """ super().__init__(message) self.message = message self.correlation_id = correlation_id class EnvironmentUnavailableError(ValidateDomainError): """Raised when test environment is not available for validation.""" class ValidationExecutionError(ValidateDomainError): """Raised when validation playbook execution fails.""" class StageGuardViolationError(ValidateDomainError): """Raised when required upstream stage has not completed.""" ================================================ FILE: build_stream/core/validate/services.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Domain services for ValidateImageOnTest module.""" import logging from core.jobs.value_objects import CorrelationId from core.validate.entities import ValidateImageOnTestRequest logger = logging.getLogger(__name__) class ValidateQueueService: """Service for validate-image-on-test queue operations.""" def __init__(self, queue_repo) -> None: """Initialize service with PlaybookQueueRequestRepository. 
Args: queue_repo: Playbook queue request repository implementation. """ self._queue_repo = queue_repo def submit_request( self, request: ValidateImageOnTestRequest, correlation_id: CorrelationId, ) -> None: """Submit validate-image-on-test request to queue. Args: request: ValidateImageOnTestRequest to submit. correlation_id: Correlation ID for tracing. Raises: QueueUnavailableError: If queue is not accessible. """ logger.info( "Submitting validate-image-on-test request to queue: " "job_id=%s, correlation_id=%s", request.job_id, correlation_id, ) self._queue_repo.write_request(request) logger.info( "Validate-image-on-test request submitted successfully: " "job_id=%s, request_id=%s, correlation_id=%s", request.job_id, request.request_id, correlation_id, ) ================================================ FILE: build_stream/doc/README.md ================================================ # Build Stream Documentation This directory contains comprehensive documentation for the Build Stream module and its workflows. ## Documentation Structure ### Overview Documentation - **[Developer Guide](./developer-guide.md)** - Complete development guide with architecture deep dive - **[Main README](../README.md)** - High-level overview and getting started guide ### Workflow Documentation - **[Jobs Management](./jobs.md)** - Job lifecycle and orchestration - **[Catalog Processing](./catalog.md)** - Software catalog parsing and role generation - **[Local Repository](./local_repo.md)** - Local package repository creation - **[Image Building](./build_image.md)** - Container image build workflows - **[Validation](./validation.md)** - Input and output validation ## Quick Navigation ### For New Contributors 1. Start with the [main README](../README.md) for architecture overview 2. Read the [Developer Guide](./developer-guide.md) for detailed understanding 3. Explore specific workflow documentation based on your area of focus ### For Debugging Issues 1. Check the relevant workflow documentation for your issue area 2. Use the Developer Guide for troubleshooting steps 3. Review the audit trail and logging sections ### For Feature Development 1. Read the Developer Guide for architecture and patterns 2. Review the relevant workflow documentation 3. Follow the contribution guidelines in the Developer Guide ## Documentation Standards All Build Stream documentation follows these standards: - **No sensitive data** - Never include passwords, tokens, or secrets - **Developer-focused** - Written for technical contributors - **Cross-referenced** - Links between related documentation - **Example-driven** - Includes practical examples and code snippets - **Maintainable** - Easy to update as the codebase evolves ## Getting Help If you need additional help beyond the documentation: 1. Check the troubleshooting sections in workflow docs 2. Review the audit trail and error handling patterns 3. Consult the architecture diagrams in the Developer Guide 4. Reach out to the Build Stream development team ## Contributing to Documentation When contributing to Build Stream: 1. Update relevant documentation for API changes 2. Add new workflow documentation for new features 3. Keep cross-references up to date 4. Follow the established documentation standards 5. Include examples and troubleshooting information ================================================ FILE: build_stream/doc/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. 
# # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. ================================================ FILE: build_stream/doc/build_image.md ================================================ # OS Image Building The OS Image Building workflow orchestrates operating system image creation for functional roles in the Omnia platform. ## What It Does The OS Image Building workflow provides: - OS image build orchestration for functional roles - Multi-architecture OS image support (x86_64, aarch64) - Package installation and configuration management ## Inputs/Outputs **Inputs:** - Catalog files defining functional roles and packages - Generated input configuration files - PXE mapping file for deployment configuration **Outputs:** - Built OS images for functional roles - OS image metadata and manifests - Package installation logs and validation reports - OS image deployment configurations ## Key Logic Locations **Primary Files:** - `api/build_image/routes.py` - HTTP endpoints for OS build operations - `orchestrator/build_image/use_cases/` - OS build orchestration logic - `core/build_image/entities.py` - OS build domain entities - `core/build_image/repositories.py` - OS build data access - `core/build_image/services.py` - OS build management services **Main Components:** - **BuildOSImageUseCase** - Orchestrates OS image build processes for functional roles - **OSService** - Manages OS build execution and monitoring - **MultiArchOSBuilder** - Handles multi-architecture OS builds - **PackageInstaller** - Manages package installation and configuration ## Workflow Flow 1. **Build Request**: Client submits image build request for functional roles 2. **OS Context Preparation**: Base functional role packages assembled 3. **Multi-Arch Setup**: OS build configurations prepared for target architectures 4. **Package Installation**: Functional role packages installed and configured 5. **OS Customization**: System settings and configurations applied 6. 
**Image Creation**: OS images built and optimized for deployment ## Architecture Support Supports multiple CPU architectures: - **x86_64** - Standard 64-bit Intel/AMD processors - **aarch64** - 64-bit ARM processors ## Build Optimization Optimizations include: - **Package caching** - Reusing downloaded packages across builds - **Parallel builds** - Concurrent building for multiple architectures - **Dependency resolution** - Efficient package dependency management ## Security Features Security capabilities include: - **Package verification** - Automated package integrity validation - **Base OS validation** - Verified base OS sources and configurations - **Signature verification** - Package signature and checksum validation ## Integration Points - Receives packages from local repository workflow - Integrates with validation workflow for quality checks - Uses Vault for secure credential management - Connects with deployment systems for functional role provisioning ## Configuration Build configuration includes: - OS build parameters and environment variables - Functional role specifications and requirements - Package installation policies and configurations - Architecture-specific OS settings ## Error Handling - Detailed OS build error reporting - Step-by-step build progress tracking - Rollback capabilities for failed builds - Automated retry for transient failures ## Monitoring - Real-time OS build progress monitoring - Resource usage tracking (CPU, memory, storage) - Build success/failure metrics - Package installation result tracking ================================================ FILE: build_stream/doc/catalog.md ================================================ # Catalog Processing The Catalog workflow handles software catalog parsing and role generation for the Omnia platform. ## What It Does The Catalog workflow provides: - Software catalog parsing from JSON files - Role generation based on catalog contents - Package categorization and dependency resolution - Integration with Ansible for role creation - Validation of catalog structure and contents ## Inputs/Outputs **Inputs:** - Software catalog JSON files - Package configuration mappings - Role templates and definitions - Platform-specific parameters **Outputs:** - Generated Ansible roles - Package dependency mappings - Validated catalog structures - Role metadata and documentation ## Key Logic Locations **Primary Files:** - `api/catalog_roles/routes.py` - HTTP endpoints for catalog operations - `api/parse_catalog/routes.py` - Catalog parsing endpoints - `orchestrator/catalog/use_cases/parse_catalog.py` - Catalog parsing logic - `orchestrator/catalog/use_cases/generate_input_files.py` - Input file generation **Main Components:** - **ParseCatalogUseCase** - Handles catalog parsing and validation - **GenerateInputFilesUseCase** - Creates Ansible input files - **CatalogRolesService** - Role generation and management - **CatalogRepository** - Catalog data persistence ## Workflow Flow 1. **Catalog Upload**: Client submits catalog via `/api/v1/parse_catalog` endpoint 2. **Structure Validation**: Catalog schema and structure validated 3. **Package Parsing**: Individual packages extracted and categorized 4. **Dependency Resolution**: Package dependencies analyzed and resolved 5. **Role Generation**: Ansible roles generated based on packages 6. **Input File Creation**: Configuration files created for downstream workflows 7. **Validation**: Generated artifacts validated for completeness 8. 
**Storage**: Results stored in artifact repository

## Package Categorization

Packages are categorized into:

- **Base OS Bundles**: Operating system packages (e.g., rhel)
- **Driver Bundles**: Hardware driver packages (e.g., nvidia_gpu_driver)
- **Functional Bundles**: Core service packages (service_k8s, slurm_custom, additional_packages)
- **Infrastructure Bundles**: CSI and infrastructure packages (csi_driver_powerscale)
- **Miscellaneous**: Additional packages that don't fit other categories

## Integration Points

- Feeds into local repository creation workflow
- Provides input for image building workflows
- Integrates with validation workflow for quality checks
- Uses Vault for secure access to package repositories

## Configuration

Catalog processing is configured through:

- Package mapping files
- Adapter policy configurations
- Validation rules and schemas

================================================
FILE: build_stream/doc/jobs.md
================================================

# Jobs Management

The Jobs workflow manages the complete lifecycle of build jobs in Build Stream, from creation through completion and monitoring.

## What It Does

The Jobs workflow provides:

- Job creation with idempotency guarantees
- Stage-based execution with state management
- Job monitoring and status tracking

## Inputs/Outputs

**Inputs:**
- Job creation requests with stage definitions
- Authentication tokens for security
- Optional job parameters and configuration

**Outputs:**
- Job IDs for tracking
- Stage execution results
- Audit events for compliance
- Error details and diagnostics

## Key Logic Locations

**Primary Files:**
- `api/jobs/routes.py` - HTTP endpoints for job operations
- `orchestrator/jobs/use_cases/create_job.py` - Job creation business logic
- `core/jobs/entities.py` - Job and Stage domain entities
- `core/jobs/repositories.py` - Data access layer
- `core/jobs/services.py` - Job-related domain services

**Main Components:**
- **CreateJobUseCase** - Handles job creation with validation
- **JobRepository** - Manages job persistence
- **StageRepository** - Manages stage state tracking
- **ResultPoller** - Handles async result collection

## Workflow Flow

1. **Job Creation**: Client submits job via `/api/v1/jobs` endpoint
2. **Validation**: Request validated for authentication and schema
3. **Idempotency Check**: Prevents duplicate job creation
4. **Stage Initialization**: Job broken into executable stages
5. **Async Execution**: Stages queued for background processing
6. **Status Updates**: Job status tracked through state transitions
7. **Result Collection**: Results polled and stored
8. **Audit Logging**: All operations logged for traceability

## Prerequisites

To run jobs, the following infrastructure components are required:

- **PostgreSQL Database**: Used for persistent storage of job metadata and status
- **S3-compatible Object Storage**: Utilized for storing build artifacts, such as catalog files and build images
- **Message Queue (e.g., RabbitMQ, Kafka)**: Enables asynchronous communication between job components and facilitates scalable processing
- **Container Runtime (e.g., Docker, containerd)**: Required for building and validating container images

These components must be properly configured and accessible to the Build Stream service for successful job execution.
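## Example: Creating a Job

The sketch below shows roughly what a job creation call could look like from a client script. It is illustrative only: the `/api/v1/jobs` endpoint and the stage names come from this document, but the payload field names, port, and token handling are assumptions; consult the generated API docs (`/docs`) for the authoritative request schema.

```python
# Illustrative sketch only: payload fields, port, and token are assumptions.
import requests

BASE_URL = "http://localhost:8000"  # assumed local development port
TOKEN = "<jwt-from-auth-endpoint>"  # placeholder bearer token

response = requests.post(
    f"{BASE_URL}/api/v1/jobs",
    headers={"Authorization": f"Bearer {TOKEN}"},
    json={
        # Hypothetical body: the ordered stages this job should execute.
        "stages": [
            "parse-catalog",
            "generate-input-files",
            "create-local-repository",
            "build-image-x86_64",
        ],
    },
    timeout=30,
)
response.raise_for_status()
print("Created job:", response.json())
```

The returned job ID can then be used to track the job as its stages move through their state transitions.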
## API Documentation - See Omnia ReadTheDocs for complete API documentation - Local development docs: `http://localhost:${PORT}/docs` - Local ReDoc: `http://localhost:${PORT}/redoc` ## Stage Types Jobs support multiple stages: - **parse-catalog** - Software catalog processing - **generate-input-files** - Input file generation - **create-local-repository** - Local repository creation - **build-image-x86_64** - x86_64 OS image building - **build-image-aarch64** - aarch64 OS image building - **validate-image-on-test** - Image validation testing ## Error Handling - Invalid state transitions are rejected - Comprehensive error reporting with context - Audit trail captures all error events ================================================ FILE: build_stream/doc/local_repo.md ================================================ # Local Repository The Local Repository workflow manages the creation and configuration of local package repositories for the Omnia platform. ## What It Does The Local Repository workflow provides: - Local package repository setup and configuration - Package synchronization from remote sources - Repository metadata generation and management - Integration with Pulp for repository management - Repository validation and health checking ## Inputs/Outputs **Inputs:** - Package lists from catalog processing - Repository configuration parameters - Remote repository URLs and credentials - Storage and bandwidth constraints **Outputs:** - Configured local repositories - Synchronized package metadata - Repository access credentials - Health check reports and validation results ## Key Logic Locations **Primary Files:** - `api/local_repo/routes.py` - HTTP endpoints for repository operations - `orchestrator/local_repo/use_cases/create_local_repo.py` - Repository creation logic - `core/localrepo/entities.py` - Repository domain entities - `core/localrepo/repositories.py` - Repository data access - `core/localrepo/services.py` - Repository management services **Main Components:** - **CreateLocalRepoUseCase** - Handles repository creation and setup - **LocalRepoService** - Repository management and operations - **LocalRepoRepository** - Repository configuration persistence - **PackageSyncService** - Package synchronization from remote sources ## Workflow Flow 1. **Repository Request**: Client submits repository creation request 2. **Configuration Validation**: Repository parameters validated 3. **Remote Source Setup**: Remote repository connections configured 4. **Package Synchronization**: Packages synced from remote sources 5. **Metadata Generation**: Repository metadata created and updated 6. **Access Configuration**: User access and permissions configured 7. **Health Validation**: Repository health and accessibility validated 8. 
**Registration**: Repository registered with downstream systems ## Repository Types Supports multiple repository types: - **YUM/DNF repositories** - RPM-based package management - **APT repositories** - Debian-based package management - **Python repositories** - PyPI-compatible package hosting - **Custom repositories** - Organization-specific package formats ## Integration Points - Receives package lists from catalog workflow - Provides packages to image building workflow - Integrates with validation workflow for quality checks - Uses Vault for secure credential storage - Connects to Pulp for advanced repository management ## Configuration Repository configuration includes: - Storage locations and quotas - Remote source URLs and credentials - Synchronization schedules and policies - Access control and permissions - Health check parameters ## Security - Secure credential management through Vault - Access control based on user roles - Package signature verification - Audit logging for all repository operations ## Error Handling - Graceful handling of remote source failures - Retry mechanisms for synchronization errors - Detailed error reporting and diagnostics - Rollback capabilities for failed operations ## Monitoring - Repository health status monitoring - Package synchronization progress tracking - Storage usage and quota monitoring - Access logging and audit trails ## Performance Optimization - Incremental synchronization to minimize bandwidth - Parallel package downloading - Caching of repository metadata - Optimized storage layouts for fast access ================================================ FILE: build_stream/doc/validation.md ================================================ # Validation The Validation workflow provides comprehensive validation for built images on provided testbeds specified in the PXE mapping file. 
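The testbeds come from a PXE mapping CSV. As a minimal sketch, assuming the same `FUNCTIONAL_GROUP_NAME` column that `generate_catalog.py` reads (the file path and group names below are placeholders), the functional groups to validate can be listed like this:

```python
# Minimal sketch: list the functional groups named in a PXE mapping CSV.
# Assumes the FUNCTIONAL_GROUP_NAME column used elsewhere in build_stream;
# the file path is a placeholder.
import csv

groups = set()
with open("pxe_mapping.csv", encoding="utf-8") as csv_file:
    for row in csv.DictReader(csv_file):
        name = (row.get("FUNCTIONAL_GROUP_NAME") or "").strip()
        if name:
            groups.add(name)

print(sorted(groups))  # e.g. ['slurm_control_node_x86_64', 'slurm_node_x86_64']
```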
## What It Does The Validation workflow provides: - **validate_image_on_test** - Validates built images on testbeds - Testbed deployment from PXE mapping file configuration - Image boot testing and functionality validation - Network connectivity and service validation - Performance and resource utilization testing - Compliance and security validation on target hardware ## Inputs/Outputs **Inputs:** - Built container images from Build Image workflow - User-specified testbeds from catalog for validation - PXE mapping file with testbed configurations - Test validation criteria and test scripts - Network and hardware specifications - Expected service configurations **Outputs:** - Testbed deployment results and status - Image boot validation reports - Service functionality test results - Performance metrics and benchmarks - Error diagnostics and troubleshooting guides - Compliance validation reports ## Key Logic Locations **Primary Files:** - `api/validate/routes.py` - HTTP endpoints for validation operations - `orchestrator/validate/use_cases/` - Validation logic implementations - `core/validate/entities.py` - Validation domain entities - `core/validate/repositories.py` - Validation data access - `core/validate/services.py` - Validation processing services **Main Components:** - **ValidateImageOnTestUseCase** - Orchestrates image validation on testbeds - **PXEMappingParser** - Parses PXE mapping file for testbed configurations - **TestbedDeployer** - Deploys images to testbeds via PXE - **ImageBootValidator** - Validates image boot and startup - **ServiceValidator** - Tests service functionality - **PerformanceValidator** - Measures performance metrics - **ComplianceValidator** - Checks compliance on target hardware ## Validation Types **Image Boot Validation:** - PXE boot configuration validation - Image loading and initialization testing - Kernel and initrd validation - Boot sequence verification - Hardware compatibility checking **Service Validation:** - Service startup and registration testing - API endpoint accessibility validation - Database connectivity verification - Network service functionality testing - Inter-service communication validation **Performance Validation:** - CPU and memory utilization testing - Disk I/O and network throughput testing - Response time and latency measurement - Load testing and stress testing - Resource optimization validation **Compliance Validation:** - Security policy validation on target hardware - Regulatory compliance checking - Configuration standard validation - Access control verification - Audit trail validation ## Workflow Flow 1. **Validation Request**: Client submits image validation request with specified testbeds from catalog 2. **PXE Mapping Parsing**: Testbed configurations extracted from PXE mapping file 3. **Testbed Configuration**: User-provided testbeds from catalog are configured for validation 4. **Image Deployment**: Container image deployed to specified testbeds via PXE 5. **Manual PXE Boot**: User runs `set_pxe_boot` utility to boot the images 6. **Boot Validation**: Image boot sequence validated and monitored 7. **Service Testing**: Deployed services tested for functionality 8. **Performance Testing**: Performance metrics collected and analyzed 9. **Compliance Checking**: Security and compliance validation performed 10. **Report Generation**: Comprehensive validation reports created 11. **Result Storage**: Validation results stored for audit trail 12. 
**Notification**: Validation status notifications sent ## Manual PXE Boot Step After the `validate_image_on_test` API completes image deployment, users must manually run the `set_pxe_boot` utility from `omnia/utils/set_pxe_boot` to initiate the boot process: **Required Action:** ```bash # Run the set_pxe_boot utility from omnia/utils to boot deployed images omnia/utils/set_pxe_boot --testbed -i ``` **Purpose:** - Configures PXE boot settings for the deployed images - Initiates the boot sequence on selected testbeds - Enables monitoring and validation of the boot process - Provides manual control over boot timing and test execution **Parameters:** - `--testbed`: Target testbed identifier from PXE mapping file - `-i`: Image name to boot (from validation request) - Optional: `--timeout`: Boot timeout duration - Optional: `--debug`: Enable debug logging **Integration Notes:** - Must be run after `validate_image_on_test` API completes successfully - Prepares testbeds for automated boot validation monitoring - Enables subsequent boot validation, service testing, and performance measurement ## PXE Mapping Management PXE mapping configuration includes: - **Testbed Definitions** - Hardware specifications and capabilities - **Network Configuration** - IP addresses and network settings - **Boot Parameters** - Kernel parameters and boot options - **Storage Configuration** - Disk layouts and mount points - **Validation Criteria** - Test requirements and success criteria ## Security Validation Security checks include: - **Image Security Scanning** - Container image vulnerability analysis - **Testbed Security** - Testbed access control and isolation - **Network Security** - Network segmentation and firewall validation - **Data Protection** - Sensitive data protection on testbeds - **Compliance Checking** - Hardware and software compliance validation ## Quality Assurance Quality metrics include: - **Boot Reliability** - Image boot success rate and stability - **Service Availability** - Service uptime and accessibility - **Performance Metrics** - Response times and resource utilization - **Hardware Compatibility** - Hardware driver compatibility and performance - **Test Coverage** - Validation test completeness and effectiveness ## Integration Points - Integrates with Build Image workflow for image validation - Connects to PXE infrastructure for testbed deployment - Integrates with monitoring systems for performance metrics - Connects to testbed management systems for hardware control - Links to compliance systems for regulatory validation ## Configuration Validation configuration includes: - PXE mapping file locations and formats - User-specified testbeds from catalog for validation - Validation test suites and test scripts - Performance thresholds and benchmarks - Compliance rules and security policies ## Error Handling - Testbed deployment failure diagnostics - Image boot error analysis and troubleshooting - Service failure detection and recovery suggestions - Performance issue identification and optimization recommendations - Automated testbed recovery and retry mechanisms ## Reporting Validation reports provide: - Image validation status summary across testbeds - Boot performance and reliability metrics - Service functionality test results - Performance benchmarks and comparisons - Hardware compatibility assessment - Security and compliance validation status - Troubleshooting guides and recommendations ## Continuous Validation Ongoing validation includes: - Automated image testing on new builds - 
Periodic testbed health and performance monitoring - Continuous hardware compatibility validation - Regular security and compliance checking - Performance regression testing - Testbed maintenance and optimization ================================================ FILE: build_stream/generate_catalog.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. #!/usr/bin/env python3 """Generate updated catalog_rhel.json from input/config directory.""" import csv import json import os import re import argparse from collections import defaultdict from pathlib import Path _FUNCTIONAL_BUNDLES = { "service_k8s", "slurm_custom", "additional_packages", } _MISC_BUNDLE = "additional_packages" _INFRA_BUNDLES = { "csi_driver_powerscale", } def load_json(filepath): """Load and return JSON from the given file path.""" with open(filepath, 'r', encoding='utf-8') as json_file: return json.load(json_file) def _is_infra_package_name(pkg_name: str) -> bool: """Return True if a package name should be considered infrastructure (CSI-related).""" name = (pkg_name or "").lower() has_csi_token = re.search(r'(^|[^a-z0-9])csi([^a-z0-9]|$)', name) is not None has_csi_prefix = name.startswith('csi-') or '/csi-' in name or name.endswith('/csi') return ( has_csi_token or has_csi_prefix or 'powerscale' in name or 'snapshotter' in name or 'helm-charts' in name ) def load_software_config(config_path): """Load software_config.json. Returns: - allowed_by_arch: {arch -> set(bundle_name)} - bundle_roles: {bundle_name -> list(role_name)} - versions_by_name: {bundle_name -> version_string} """ config = load_json(config_path) allowed_by_arch = { 'x86_64': set(), 'aarch64': set(), } versions_by_name = {} for software in config.get('softwares', []): name = software.get('name') arches = software.get('arch', []) or [] if not name: continue for arch in arches: if arch in allowed_by_arch: allowed_by_arch[arch].add(name) if software.get('version'): versions_by_name[name] = software.get('version') # bundle_roles is defined by top-level keys like "slurm_custom", "service_k8s", etc. # Each is a list of objects with {"name": ""}. 
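    # Illustrative (hypothetical) example of the shapes involved:
    #   software_config.json entry:  "slurm_custom": [{"name": "slurm_control_node"}, {"name": "slurm_node"}]
    #   resulting bundle_roles:      {"slurm_custom": ["slurm_control_node", "slurm_node"]}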
bundle_roles = {} for bundle_name, roles in config.items(): if bundle_name in ['cluster_os_type', 'cluster_os_version', 'repo_config', 'softwares']: continue if not isinstance(roles, list): continue role_names = [] for r in roles: if isinstance(r, dict) and r.get('name'): role_names.append(r['name']) if role_names: bundle_roles[bundle_name] = role_names return allowed_by_arch, bundle_roles, versions_by_name def _extract_arch_from_pxe_group(pxe_group: str): """Extract architecture suffix from PXE functional group name.""" if pxe_group.endswith('_x86_64'): return 'x86_64' if pxe_group.endswith('_aarch64'): return 'aarch64' return None def load_pxe_functional_groups(pxe_file): """Load PXE mapping file and extract unique functional group names.""" functional_groups = set() with open(pxe_file, 'r', encoding='utf-8') as csv_file: reader = csv.DictReader(csv_file) for row in reader: group_name = row.get('FUNCTIONAL_GROUP_NAME', '').strip() if group_name: functional_groups.add(group_name) return sorted(functional_groups) def _append_unique_source(pkg_sources, source): """Append source only if an identical entry does not already exist.""" if source not in pkg_sources: pkg_sources.append(source) def _render_templated_url(template: str, bundle_name: str, versions_by_name: dict) -> str: """Render very simple Jinja-like templates used in config URLs. Supports patterns: - {{ _version }} - {{ _version.split('.')[:2] | join('.') }} """ if not template or '{{' not in template: return template version = versions_by_name.get(bundle_name) if not version: return '' major_minor = '.'.join(version.split('.')[:2]) # Replace the split/join pattern first pattern_mm = re.compile(r"\{\{\s*" + re.escape(bundle_name) + r"_version\.split\(\s*'\.'\s*\)\s*\[:2\]\s*\|\s*join\(\s*'\.'\s*\)\s*\}\}") rendered = pattern_mm.sub(major_minor, template) # Replace plain version token pattern_v = re.compile(r"\{\{\s*" + re.escape(bundle_name) + r"_version\s*\}\}") rendered = pattern_v.sub(version, rendered) # If anything templated remains, return empty to signal unresolved return '' if '{{' in rendered else rendered def collect_packages_from_config(config_dir, allowed_bundles_by_arch, versions_by_name): """Collect all packages from config JSON files, filtered by allowed bundles per arch.""" # pylint: disable=too-many-locals,too-many-branches,too-many-nested-blocks packages = defaultdict(lambda: { 'name': None, 'type': None, 'architectures': set(), 'sources': [], 'tag': None, 'url': None, 'version': None, 'bundles': set(), }) for root, _dirs, files in os.walk(config_dir): for file in files: if not file.endswith('.json'): continue # Extract bundle name from filename (e.g., 'service_k8s.json' -> 'service_k8s') bundle_name = file.replace('.json', '') filepath = os.path.join(root, file) # Extract arch from path (e.g., x86_64 or aarch64) path_parts = Path(filepath).parts arch = None for part in path_parts: if part in ['x86_64', 'aarch64']: arch = part break if not arch: continue # Skip if this bundle is not allowed for this architecture if bundle_name not in allowed_bundles_by_arch.get(arch, set()): print(f" Skipping {file} for arch {arch} (not in software_config.json)") continue data = load_json(filepath) # Process each section in the JSON for _section_name, section_data in data.items(): if not isinstance(section_data, dict) or 'cluster' not in section_data: continue for pkg in section_data['cluster']: pkg_name = pkg['package'] pkg_type = pkg['type'] # Create unique key key = f"{pkg_name}_{pkg_type}" packages[key]['name'] = pkg_name 
packages[key]['type'] = pkg_type packages[key]['architectures'].add(arch) packages[key]['bundles'].add(bundle_name) # Handle different package types if pkg_type in ['rpm', 'rpm_repo']: repo_name = pkg.get('repo_name', '') if repo_name: _append_unique_source( packages[key]['sources'], { 'Architecture': arch, 'RepoName': repo_name } ) elif pkg_type in ['tarball', 'manifest', 'iso']: url = pkg.get('url', '') # Try to resolve templated URLs using versions from software_config resolved_url = url if url and '{{' in url: resolved_url = _render_templated_url(url, bundle_name, versions_by_name) if resolved_url: _append_unique_source( packages[key]['sources'], { 'Architecture': arch, 'Uri': resolved_url } ) packages[key]['url'] = resolved_url or url # Populate package version: # - tarball: only for ucx/openmpi from software_config # - iso: restore previous behavior to include Version from software_config when present if pkg_type == 'tarball': if ( pkg_name in ('ucx', 'openmpi') and versions_by_name.get(bundle_name) ): packages[key]['version'] = versions_by_name[bundle_name] elif pkg_type == 'iso': if versions_by_name.get(bundle_name): packages[key]['version'] = versions_by_name[bundle_name] elif pkg_type == 'git': url = pkg.get('url', '') version = pkg.get('version', '') packages[key]['url'] = url packages[key]['version'] = version elif pkg_type == 'image': tag = pkg.get('tag', '') packages[key]['tag'] = tag packages[key]['version'] = tag return packages def generate_catalog(input_dir, software_config_path, pxe_mapping_file): """Generate complete catalog structure.""" # pylint: disable=too-many-locals,too-many-branches,too-many-nested-blocks # Load allowed software bundles from software_config.json allowed_bundles_by_arch, bundle_roles, versions_by_name = load_software_config(software_config_path) print("Allowed software bundles by arch: x86_64={}, aarch64={}".format( sorted(allowed_bundles_by_arch.get('x86_64', set())), sorted(allowed_bundles_by_arch.get('aarch64', set())) )) # Load PXE functional groups pxe_groups = load_pxe_functional_groups(pxe_mapping_file) print("PXE functional groups: {}".format(pxe_groups)) packages = collect_packages_from_config(input_dir, allowed_bundles_by_arch, versions_by_name) # Convert sets to lists for JSON serialization for pkg_data in packages.values(): pkg_data['architectures'] = sorted(list(pkg_data['architectures'])) # Map packages to roles allowed_bundles = set().union(*allowed_bundles_by_arch.values()) role_package_map, package_id_map = map_packages_to_roles( packages, input_dir, allowed_bundles, bundle_roles ) print("Role to package mapping: {}".format(dict(role_package_map))) # Build catalog structure catalog = { "Catalog": { "Name": "Catalog", "Version": "1.0", "Identifier": "image-build", "FunctionalLayer": [], "BaseOS": [], "Infrastructure": [], "Drivers": [], "DriverPackages": {}, "FunctionalPackages": {}, "OSPackages": {}, "Miscellaneous": [], "InfrastructurePackages": {} } } # Categorize packages using the package_id_map os_packages = {} functional_packages = {} infra_packages = {} misc_package_ids = [] os_pkg_id_counter = 1 infra_pkg_id_counter = 1 for key, pkg_data in packages.items(): pkg_name = pkg_data['name'] bundles = set(pkg_data.get('bundles') or []) # Determine classification using bundle membership. 
# - Functional: service_k8s, slurm_custom, additional_packages # - Infrastructure: csi_driver_powerscale (plus name-based fallback) # - BaseOS: everything else is_functional = bool(bundles & _FUNCTIONAL_BUNDLES) is_infra = bool(bundles & _INFRA_BUNDLES) or _is_infra_package_name(pkg_name) is_misc = _MISC_BUNDLE in bundles if is_infra: pkg_id = f"infrastructure_package_id_{infra_pkg_id_counter}" infra_pkg_id_counter += 1 infra_packages[pkg_id] = create_infra_package_entry(pkg_data) continue if is_functional: # Use the package_id from package_id_map if key in package_id_map: pkg_id = package_id_map[key] functional_packages[pkg_id] = create_package_entry(pkg_data) if is_misc: misc_package_ids.append(pkg_id) continue pkg_id = f"os_package_id_{os_pkg_id_counter}" os_pkg_id_counter += 1 os_packages[pkg_id] = create_package_entry(pkg_data) catalog["Catalog"]["FunctionalPackages"] = functional_packages catalog["Catalog"]["OSPackages"] = os_packages catalog["Catalog"]["Miscellaneous"] = sorted(list(set(misc_package_ids))) catalog["Catalog"]["InfrastructurePackages"] = infra_packages # Add BaseOS section catalog["Catalog"]["BaseOS"] = [{ "Name": "RHEL", "Version": "10.0", "osPackages": sorted(os_packages.keys()) }] # Add Infrastructure section if infra_packages: catalog["Catalog"]["Infrastructure"] = [{ "Name": "csi", "InfrastructurePackages": sorted(infra_packages.keys()) }] # Build Functional Layers based on PXE mapping catalog["Catalog"]["FunctionalLayer"] = build_functional_layers( functional_packages, pxe_groups, role_package_map ) return catalog def build_functional_layers(functional_packages, pxe_groups, role_package_map): """Build FunctionalLayer based on PXE functional groups and package mappings.""" functional_layers = [] # Map PXE functional groups to package roles for pxe_group in pxe_groups: # Extract role name from PXE group # (e.g., 'slurm_control_node_x86_64' -> 'slurm_control_node') # Remove architecture suffix role_name = pxe_group.replace('_x86_64', '').replace('_aarch64', '') # Find packages for this role. # Also merge in packages from the "_first" section (e.g., # service_kube_control_plane_first) which covers first-node-only items # like manifests and tarballs that are not present in the base section. package_ids = list(role_package_map.get(role_name, [])) first_role = role_name + "_first" if first_role in role_package_map: package_ids = sorted(set(package_ids) | set(role_package_map[first_role])) # Filter package IDs by architecture encoded in PXE group name. 
pxe_arch = _extract_arch_from_pxe_group(pxe_group) if pxe_arch: package_ids = [ pkg_id for pkg_id in package_ids if pkg_id in functional_packages and pxe_arch in functional_packages[pkg_id].get('Architecture', []) ] functional_layers.append({ "Name": pxe_group, "FunctionalPackages": package_ids }) return functional_layers def map_packages_to_roles(packages, config_dir, allowed_bundles, bundle_roles): """Map packages to their roles based on which config section they appear in.""" # pylint: disable=too-many-locals,too-many-branches,too-many-nested-blocks role_package_map = defaultdict(list) package_id_map = {} pkg_id_counter = 1 # First pass: assign package IDs (only for functional bundles) for key, pkg_data in packages.items(): pkg_name = pkg_data['name'] bundles = set(pkg_data.get('bundles') or []) is_functional = bool(bundles & _FUNCTIONAL_BUNDLES) is_infra = bool(bundles & _INFRA_BUNDLES) or _is_infra_package_name(pkg_name) if is_functional and not is_infra: pkg_id = f"package_id_{pkg_id_counter}" pkg_id_counter += 1 package_id_map[key] = pkg_id # Second pass: map packages to roles by scanning config files for root, _dirs, files in os.walk(config_dir): for file in files: if not file.endswith('.json'): continue bundle_name = file.replace('.json', '') if bundle_name not in allowed_bundles: continue # Only functional bundles should contribute to role-package mappings. if bundle_name not in _FUNCTIONAL_BUNDLES: continue filepath = os.path.join(root, file) data = load_json(filepath) # Process each section in the JSON for section_name, section_data in data.items(): if not isinstance(section_data, dict) or 'cluster' not in section_data: continue for pkg in section_data['cluster']: pkg_name = pkg['package'] pkg_type = pkg['type'] key = f"{pkg_name}_{pkg_type}" if key in package_id_map: pkg_id = package_id_map[key] # Map to role(s) # 1) If the section name is a role (e.g., slurm_node), map directly. # 2) If the section name is the bundle itself (bundle_name) or "cluster", # treat these as common packages and map to all roles declared for # that bundle in software_config.json. 
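                        # Illustrative outcome (bundle and role names reuse the examples
                        # above; the JSON layout is the same one scanned by this loop):
                        #   slurm_custom.json, section 'slurm_node'   -> role_package_map['slurm_node']
                        #   slurm_custom.json, section 'slurm_custom'
                        #   or 'cluster' (common packages)            -> every role that
                        #       software_config.json declares for the 'slurm_custom' bundle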
if section_name not in ['cluster', bundle_name]: role_package_map[section_name].append(pkg_id) else: for role in bundle_roles.get(bundle_name, []): role_package_map[role].append(pkg_id) # Remove duplicates for role in role_package_map: role_package_map[role] = sorted(list(set(role_package_map[role]))) return role_package_map, package_id_map def create_package_entry(pkg_data): """Create a package entry for FunctionalPackages or OSPackages.""" entry = { "Name": pkg_data['name'], "SupportedOS": [{"Name": "RHEL", "Version": "10.0"}], "Architecture": pkg_data['architectures'], "Type": pkg_data['type'] } if pkg_data['tag']: entry["Tag"] = pkg_data['tag'] entry["Version"] = pkg_data['tag'] # For non-image packages, include a Version when known if pkg_data.get('version') and 'Version' not in entry and pkg_data['type'] != 'manifest': entry["Version"] = pkg_data['version'] if pkg_data['sources']: entry["Sources"] = pkg_data['sources'] return entry def create_infra_package_entry(pkg_data): """Create an infrastructure package entry.""" entry = { "Name": pkg_data['name'], "Type": pkg_data['type'], "Version": pkg_data.get('version'), "SupportedFunctions": [{"Name": "csi"}] } if pkg_data['architectures']: entry["Architecture"] = pkg_data['architectures'] if pkg_data['tag']: entry["Tag"] = pkg_data['tag'] # For git type packages, create Sources array with Uri if pkg_data['type'] == 'git' and pkg_data.get('url'): sources = [] for arch in pkg_data['architectures']: sources.append({ "Architecture": arch, "Uri": pkg_data['url'] }) entry["Sources"] = sources return entry if __name__ == '__main__': parser = argparse.ArgumentParser(description='Generate catalog_rhel.json from input/config') parser.add_argument( '--base-dir', default='/opt/omnia/input/project_default/', help='Project base directory containing input/ and build_stream/ folders', ) args = parser.parse_args() base_dir = args.base_dir if not os.path.exists(base_dir): repo_root = Path(__file__).resolve().parents[1] base_dir = str(repo_root) # Support base_dir as either repo root (contains input/ and build_stream/) # or the input directory itself. 
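    # Illustrative invocations (a sketch; paths are hypothetical, and both forms
    # are resolved by the logic below):
    #   python build_stream/generate_catalog.py --base-dir /opt/omnia/input/project_default/
    #   python build_stream/generate_catalog.py --base-dir /opt/omnia/input/project_default/input
    # Either way the result is written to
    # <repo_root>/build_stream/core/catalog/test_fixtures/catalog_rhel.json.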
base_dir_path = Path(base_dir).resolve() is_input_dir = (base_dir_path / 'software_config.json').exists() and (base_dir_path / 'config').exists() if is_input_dir: input_dir = str(base_dir_path) repo_root = Path(__file__).resolve().parents[1] else: input_dir = str(base_dir_path / 'input') repo_root = base_dir_path input_config_dir = os.path.join(input_dir, 'config') software_config_file = os.path.join(input_dir, 'software_config.json') pxe_mapping_csv = os.path.join(input_dir, 'pxe_mapping_file.csv') output_file = os.path.join( str(repo_root), 'build_stream', 'core', 'catalog', 'test_fixtures', 'catalog_rhel.json', ) print("Generating catalog from input/config...") print(f"Using software config: {software_config_file}") print(f"Using PXE mapping: {pxe_mapping_csv}") generated_catalog = generate_catalog(input_config_dir, software_config_file, pxe_mapping_csv) print(f"\nWriting to {output_file}...") with open(output_file, 'w', encoding='utf-8') as out_file: json.dump(generated_catalog, out_file, indent=2) print("Done!") print("\nGenerated catalog with:") print(f" - {len(generated_catalog['Catalog']['FunctionalPackages'])} functional packages") print(f" - {len(generated_catalog['Catalog']['OSPackages'])} OS packages") print( f" - {len(generated_catalog['Catalog']['InfrastructurePackages'])} infrastructure packages" ) print(f" - {len(generated_catalog['Catalog']['FunctionalLayer'])} functional layers") ================================================ FILE: build_stream/generate_catalog_examples.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. #!/usr/bin/env python3 import argparse import json import os import shutil from pathlib import Path # Import sibling module generate_catalog.py in the same folder # When executed as a script (python build_stream/generate_catalog_examples.py), # sys.path[0] will be this folder, so a plain import works. import generate_catalog as gen def resolve_base_and_paths(base_dir_arg: str): base_dir = base_dir_arg if not os.path.exists(base_dir): repo_root = Path(__file__).resolve().parents[1] base_dir = str(repo_root) base_dir_path = Path(base_dir).resolve() # Support base_dir as either repo root (contains input/) or the input directory itself. 
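    # Illustrative resolution (a sketch; paths are hypothetical):
    #   base_dir = /opt/omnia/input/project_default
    #       -> input_dir = /opt/omnia/input/project_default/input, repo_root = base_dir
    #   base_dir = /opt/omnia/input/project_default/input  (has config/ and software_config.json)
    #       -> input_dir = base_dir, repo_root = the checkout containing this script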
is_input_dir = ( (base_dir_path / 'software_config.json').exists() and (base_dir_path / 'config').exists() ) if is_input_dir: input_dir = str(base_dir_path) repo_root = Path(__file__).resolve().parents[1] else: input_dir = str(base_dir_path / 'input') repo_root = base_dir_path return repo_root, Path(input_dir) def copy_mapping_to_input(mapping_dir: Path, input_dir: Path): src_sw = mapping_dir / 'software_config.json' src_pxe = mapping_dir / 'pxe_mapping_file.csv' if not src_sw.exists() or not src_pxe.exists(): raise FileNotFoundError(f"Mapping set missing files in {mapping_dir}") dst_sw = input_dir / 'software_config.json' dst_pxe = input_dir / 'pxe_mapping_file.csv' shutil.copyfile(src_sw, dst_sw) shutil.copyfile(src_pxe, dst_pxe) def generate_example_catalogs(base_dir: str): repo_root, input_dir_path = resolve_base_and_paths(base_dir) examples_catalog_dir = repo_root / 'examples' / 'catalog' mapping_base = examples_catalog_dir / 'mapping_file_software_config' # Map output catalog files to their corresponding mapping folder names targets = { 'catalog_rhel_aarch64_with_slurm_only.json': 'catalog_rhel_aarch64_with_slurm_only_json', 'catalog_rhel_x86_64_with_slurm_only.json': 'catalog_rhel_x86_64_with_slurm_only_json', 'catalog_rhel_with_ucx_openmpi.json': 'catalog_rhel_with_ucx_openmpi_json', 'catalog_rhel.json': 'catalog_rhel_json', } # Ensure catalog_rhel.json is generated last generation_order = [ 'catalog_rhel_aarch64_with_slurm_only.json', 'catalog_rhel_x86_64_with_slurm_only.json', 'catalog_rhel_with_ucx_openmpi.json', 'catalog_rhel.json', ] # Paths used by the generator input_config_dir = str(input_dir_path / 'config') software_config_file = str(input_dir_path / 'software_config.json') pxe_mapping_csv = str(input_dir_path / 'pxe_mapping_file.csv') results = [] for out_name in generation_order: mapping_folder = targets[out_name] mapping_dir = mapping_base / mapping_folder print(f"\n==> Preparing mapping for {out_name} from {mapping_dir}") copy_mapping_to_input(mapping_dir, input_dir_path) print( f"Generating catalog using software_config={software_config_file} " f"and pxe_mapping={pxe_mapping_csv}" ) catalog_obj = gen.generate_catalog(input_config_dir, software_config_file, pxe_mapping_csv) out_path = examples_catalog_dir / out_name print(f"Writing generated catalog to {out_path}") with open(out_path, 'w', encoding='utf-8') as f: json.dump(catalog_obj, f, indent=2) results.append({ 'output': str(out_path), 'functional_packages': len(catalog_obj['Catalog']['FunctionalPackages']), 'os_packages': len(catalog_obj['Catalog']['OSPackages']), 'infra_packages': len(catalog_obj['Catalog']['InfrastructurePackages']), 'functional_layers': len(catalog_obj['Catalog']['FunctionalLayer']), }) print("\nSummary:") for r in results: print( f" - {r['output']} => functional={r['functional_packages']}, " f"os={r['os_packages']}, infra={r['infra_packages']}, layers={r['functional_layers']}" ) def main(): parser = argparse.ArgumentParser( description='Generate example catalogs by copying mapping/software_config into input/ and rendering catalogs.' ) parser.add_argument( '--base-dir', default='/opt/omnia/input/project_default/', help='Project base directory containing input/ and build_stream/ folders, or the input/ directory itself.' ) args = parser.parse_args() generate_example_catalogs(args.base_dir) if __name__ == '__main__': main() ================================================ FILE: build_stream/infra/__init__.py ================================================ # Copyright 2026 Dell Inc. 
or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. ================================================ FILE: build_stream/infra/artifact_store/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Artifact store infrastructure implementations.""" from .in_memory_artifact_metadata import InMemoryArtifactMetadataRepository from .in_memory_artifact_store import InMemoryArtifactStore from .file_artifact_store import FileArtifactStore __all__ = [ "InMemoryArtifactStore", "InMemoryArtifactMetadataRepository", "FileArtifactStore", ] ================================================ FILE: build_stream/infra/artifact_store/file_artifact_store.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """File-based implementation of ArtifactStore for production use.""" import hashlib import io import shutil import zipfile from pathlib import Path from typing import Dict, Optional, Set, Union from core.artifacts.exceptions import ( ArtifactAlreadyExistsError, ArtifactNotFoundError, ArtifactStoreError, ArtifactValidationError, ) from core.artifacts.value_objects import ( ArtifactDigest, ArtifactKey, ArtifactKind, ArtifactRef, StoreHint, ) class FileArtifactStore: """File-based artifact store for production use. Stores artifacts on a local or network filesystem. Supports both FILE and ARCHIVE kinds via unified store/retrieve API. """ DEFAULT_MAX_ARTIFACT_SIZE: int = 50 * 1024 * 1024 # 50 MB DEFAULT_ALLOWED_CONTENT_TYPES: Set[str] = { "application/json", "application/zip", "application/octet-stream", "text/plain", } def __init__( self, base_path: Path, max_artifact_size_bytes: int = DEFAULT_MAX_ARTIFACT_SIZE, allowed_content_types: Optional[Set[str]] = None, ) -> None: """Initialize file-based artifact store. Args: base_path: Base directory path for artifact storage. 
max_artifact_size_bytes: Maximum allowed artifact size. allowed_content_types: Set of allowed MIME content types. Raises: ValueError: If base_path is not a directory or not writable. """ self._base_path = base_path self._max_artifact_size_bytes = max_artifact_size_bytes self._allowed_content_types = ( allowed_content_types if allowed_content_types is not None else self.DEFAULT_ALLOWED_CONTENT_TYPES ) self._base_path.mkdir(parents=True, exist_ok=True) if not self._base_path.is_dir(): raise ValueError(f"base_path is not a directory: {base_path}") def store( self, hint: StoreHint, kind: ArtifactKind, content: Optional[bytes] = None, file_map: Optional[Dict[str, bytes]] = None, source_directory: Optional[Path] = None, content_type: str = "application/octet-stream", ) -> ArtifactRef: """Store an artifact (FILE or ARCHIVE). Args: hint: Hints for deterministic key generation. kind: FILE or ARCHIVE. content: Raw bytes (required for FILE kind). file_map: Mapping of relative paths to bytes (ARCHIVE kind). source_directory: Directory to zip (ARCHIVE kind). content_type: MIME type of the content. Returns: ArtifactRef with key, digest, size, and URI. Raises: ArtifactAlreadyExistsError: If artifact with same key exists. ArtifactValidationError: If content fails validation. ArtifactStoreError: If storage operation fails. ValueError: If wrong inputs for the given kind. """ self._validate_content_type(content_type) raw_bytes = self._resolve_content(kind, content, file_map, source_directory) self._validate_size(raw_bytes) key = self.generate_key(hint, kind) artifact_path = self._get_artifact_path(key) if artifact_path.exists(): raise ArtifactAlreadyExistsError(key=key.value) try: artifact_path.parent.mkdir(parents=True, exist_ok=True) artifact_path.write_bytes(raw_bytes) except OSError as e: raise ArtifactStoreError( f"Failed to write artifact to {artifact_path}: {e}" ) from e digest = ArtifactDigest(hashlib.sha256(raw_bytes).hexdigest()) return ArtifactRef( key=key, digest=digest, size_bytes=len(raw_bytes), uri=f"file://{artifact_path}", ) def retrieve( self, key: ArtifactKey, kind: ArtifactKind, destination: Optional[Path] = None, ) -> Union[bytes, Path]: """Retrieve an artifact. For FILE kind: returns bytes. For ARCHIVE kind: unpacks to destination and returns the path. Args: key: Artifact key to retrieve. kind: FILE or ARCHIVE. destination: Target directory for ARCHIVE unpacking. Returns: bytes for FILE kind, Path for ARCHIVE kind. Raises: ArtifactNotFoundError: If artifact does not exist. ArtifactStoreError: If retrieval fails. """ artifact_path = self._get_artifact_path(key) if not artifact_path.exists(): raise ArtifactNotFoundError(key=key.value) try: raw_bytes = artifact_path.read_bytes() except OSError as e: raise ArtifactStoreError( f"Failed to read artifact from {artifact_path}: {e}" ) from e if kind == ArtifactKind.FILE: return raw_bytes # ARCHIVE: unpack zip to destination if destination is None: import tempfile destination = Path(tempfile.mkdtemp(prefix="artifact-")) destination.mkdir(parents=True, exist_ok=True) try: with zipfile.ZipFile(io.BytesIO(raw_bytes), "r") as zf: zf.extractall(str(destination)) except (zipfile.BadZipFile, OSError) as e: raise ArtifactStoreError( f"Failed to extract archive to {destination}: {e}" ) from e return destination def exists(self, key: ArtifactKey) -> bool: """Check if an artifact exists. Args: key: Artifact key to check. Returns: True if artifact exists, False otherwise. 
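        Example (illustrative sketch; ``store`` is a FileArtifactStore instance
        and ``ref`` the ArtifactRef returned by an earlier store() call):

            if store.exists(ref.key):
                payload = store.retrieve(ref.key, ArtifactKind.FILE)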
""" artifact_path = self._get_artifact_path(key) return artifact_path.exists() def delete(self, key: ArtifactKey) -> bool: """Delete an artifact. Args: key: Artifact key to delete. Returns: True if artifact was deleted, False if not found. """ artifact_path = self._get_artifact_path(key) if artifact_path.exists(): try: artifact_path.unlink() self._cleanup_empty_dirs(artifact_path.parent) return True except OSError: return False return False def generate_key(self, hint: StoreHint, kind: ArtifactKind) -> ArtifactKey: """Generate a deterministic artifact key from hints. Key format: {namespace}/{tag_hash}/{label}.{ext} where tag_hash is a short SHA-256 of sorted tags for uniqueness. Args: hint: Store hints for key generation. kind: FILE or ARCHIVE (affects extension). Returns: Deterministic ArtifactKey. """ tag_str = "|".join( f"{k}={v}" for k, v in sorted(hint.tags.items()) ) tag_hash = hashlib.sha256(tag_str.encode()).hexdigest()[:12] ext = "zip" if kind == ArtifactKind.ARCHIVE else "bin" key_value = f"{hint.namespace}/{tag_hash}/{hint.label}.{ext}" return ArtifactKey(key_value) def _get_artifact_path(self, key: ArtifactKey) -> Path: """Get the filesystem path for an artifact key. Args: key: Artifact key. Returns: Absolute path to the artifact file. """ return self._base_path / key.value def _cleanup_empty_dirs(self, directory: Path) -> None: """Recursively remove empty parent directories up to base_path. Args: directory: Directory to start cleanup from. """ try: while directory != self._base_path and directory.is_dir(): if not any(directory.iterdir()): directory.rmdir() directory = directory.parent else: break except OSError: pass def _resolve_content( self, kind: ArtifactKind, content: Optional[bytes], file_map: Optional[Dict[str, bytes]], source_directory: Optional[Path], ) -> bytes: """Resolve the raw bytes to store based on kind and inputs. Args: kind: FILE or ARCHIVE. content: Raw bytes for FILE kind. file_map: Dict of relative paths to bytes for ARCHIVE kind. source_directory: Directory to zip for ARCHIVE kind. Returns: Raw bytes to store. Raises: ValueError: If wrong combination of inputs for the given kind. """ if kind == ArtifactKind.FILE: if content is None: raise ValueError( "content is required for FILE kind" ) if file_map is not None or source_directory is not None: raise ValueError( "file_map and source_directory must not be provided for FILE kind" ) return content # ARCHIVE kind if content is not None: raise ValueError( "content must not be provided for ARCHIVE kind; " "use file_map or source_directory" ) if file_map is not None and source_directory is not None: raise ValueError( "Provide either file_map or source_directory, not both" ) if file_map is None and source_directory is None: raise ValueError( "Either file_map or source_directory is required for ARCHIVE kind" ) if file_map is not None: return self._zip_file_map(file_map) return self._zip_directory(source_directory) # type: ignore[arg-type] def _zip_file_map(self, file_map: Dict[str, bytes]) -> bytes: """Create a zip archive from a file map. Args: file_map: Mapping of relative paths to content bytes. Returns: Zip archive as bytes. """ buf = io.BytesIO() with zipfile.ZipFile(buf, "w", zipfile.ZIP_DEFLATED) as zf: for rel_path, data in sorted(file_map.items()): zf.writestr(rel_path, data) return buf.getvalue() def _zip_directory(self, directory: Path) -> bytes: """Create a zip archive from a directory. Args: directory: Directory to zip. Returns: Zip archive as bytes. Raises: ValueError: If directory does not exist. 
""" if not directory.is_dir(): raise ValueError(f"source_directory does not exist: {directory}") buf = io.BytesIO() with zipfile.ZipFile(buf, "w", zipfile.ZIP_DEFLATED) as zf: for file_path in sorted(directory.rglob("*")): if file_path.is_file(): rel_path = file_path.relative_to(directory) zf.writestr(str(rel_path), file_path.read_bytes()) return buf.getvalue() def _validate_content_type(self, content_type: str) -> None: """Validate content type against allowlist. Args: content_type: MIME content type. Raises: ArtifactValidationError: If content type not allowed. """ if content_type not in self._allowed_content_types: raise ArtifactValidationError( f"Content type not allowed: {content_type}. " f"Allowed: {sorted(self._allowed_content_types)}" ) def _validate_size(self, raw_bytes: bytes) -> None: """Validate artifact size against maximum. Args: raw_bytes: Content bytes. Raises: ArtifactValidationError: If content exceeds max size. """ if len(raw_bytes) > self._max_artifact_size_bytes: raise ArtifactValidationError( f"Artifact size {len(raw_bytes)} bytes exceeds maximum " f"{self._max_artifact_size_bytes} bytes" ) ================================================ FILE: build_stream/infra/artifact_store/in_memory_artifact_metadata.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """In-memory implementation of ArtifactMetadataRepository for dev/test.""" from typing import Dict, List, Optional, Tuple from core.artifacts.entities import ArtifactRecord from core.jobs.value_objects import JobId, StageName class InMemoryArtifactMetadataRepository: """In-memory artifact metadata repository for development and testing. Stores ArtifactRecord instances in a dictionary keyed by (job_id, stage_name, label) triple for cross-stage lookup. """ def __init__(self) -> None: """Initialize empty in-memory repository.""" self._records: Dict[Tuple[str, str, str], ArtifactRecord] = {} def save(self, record: ArtifactRecord) -> None: """Persist an artifact metadata record. Args: record: ArtifactRecord to persist. """ key = ( str(record.job_id), str(record.stage_name), record.label, ) self._records[key] = record def find_by_job_stage_and_label( self, job_id: JobId, stage_name: StageName, label: str, ) -> Optional[ArtifactRecord]: """Find an artifact record by job, stage, and label. Args: job_id: Parent job identifier. stage_name: Stage that produced the artifact. label: Artifact label. Returns: ArtifactRecord if found, None otherwise. """ key = (str(job_id), str(stage_name), label) return self._records.get(key) def find_by_job(self, job_id: JobId) -> List[ArtifactRecord]: """Find all artifact records for a job. Args: job_id: Parent job identifier. Returns: List of ArtifactRecord (may be empty). """ job_str = str(job_id) return [ record for (j, _, _), record in self._records.items() if j == job_str ] def delete_by_job(self, job_id: JobId) -> int: """Delete all artifact records for a job. 
Args: job_id: Parent job identifier. Returns: Number of records deleted. """ job_str = str(job_id) keys_to_delete = [ key for key in self._records if key[0] == job_str ] for key in keys_to_delete: del self._records[key] return len(keys_to_delete) ================================================ FILE: build_stream/infra/artifact_store/in_memory_artifact_store.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """In-memory implementation of ArtifactStore for dev/test.""" import hashlib import io import tempfile import zipfile from pathlib import Path from typing import Dict, Optional, Set, Union from core.artifacts.exceptions import ( ArtifactAlreadyExistsError, ArtifactNotFoundError, ArtifactStoreError, ArtifactValidationError, ) from core.artifacts.value_objects import ( ArtifactDigest, ArtifactKey, ArtifactKind, ArtifactRef, StoreHint, ) class InMemoryArtifactStore: """In-memory artifact store for development and testing. Stores artifact content in a dictionary keyed by ArtifactKey. Supports both FILE and ARCHIVE kinds via unified store/retrieve API. """ DEFAULT_MAX_ARTIFACT_SIZE: int = 50 * 1024 * 1024 # 50 MB DEFAULT_ALLOWED_CONTENT_TYPES: Set[str] = { "application/json", "application/zip", "application/octet-stream", "text/plain", } def __init__( self, max_artifact_size_bytes: int = DEFAULT_MAX_ARTIFACT_SIZE, allowed_content_types: Optional[Set[str]] = None, ) -> None: """Initialize in-memory artifact store. Args: max_artifact_size_bytes: Maximum allowed artifact size. allowed_content_types: Set of allowed MIME content types. """ self._storage: Dict[str, bytes] = {} self._max_artifact_size_bytes = max_artifact_size_bytes self._allowed_content_types = ( allowed_content_types if allowed_content_types is not None else self.DEFAULT_ALLOWED_CONTENT_TYPES ) def store( self, hint: StoreHint, kind: ArtifactKind, content: Optional[bytes] = None, file_map: Optional[Dict[str, bytes]] = None, source_directory: Optional[Path] = None, content_type: str = "application/octet-stream", ) -> ArtifactRef: """Store an artifact (FILE or ARCHIVE). Args: hint: Hints for deterministic key generation. kind: FILE or ARCHIVE. content: Raw bytes (required for FILE kind). file_map: Mapping of relative paths to bytes (ARCHIVE kind). source_directory: Directory to zip (ARCHIVE kind). content_type: MIME type of the content. Returns: ArtifactRef with key, digest, size, and URI. Raises: ArtifactAlreadyExistsError: If artifact with same key exists. ArtifactValidationError: If content fails validation. ValueError: If wrong inputs for the given kind. 
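        Example (illustrative sketch; StoreHint's constructor arguments are
        assumed from how its fields are read in generate_key below, and the
        payload values are hypothetical):

            store = InMemoryArtifactStore()
            ref = store.store(
                hint=StoreHint(namespace="jobs/123", label="catalog", tags={"stage": "parse"}),
                kind=ArtifactKind.FILE,
                content=b'{"Catalog": {}}',
                content_type="application/json",
            )
            data = store.retrieve(ref.key, ArtifactKind.FILE)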
""" self._validate_content_type(content_type) raw_bytes = self._resolve_content(kind, content, file_map, source_directory) self._validate_size(raw_bytes) key = self.generate_key(hint, kind) if key.value in self._storage: raise ArtifactAlreadyExistsError(key=key.value) self._storage[key.value] = raw_bytes digest = ArtifactDigest(hashlib.sha256(raw_bytes).hexdigest()) return ArtifactRef( key=key, digest=digest, size_bytes=len(raw_bytes), uri=f"memory://{key.value}", ) def retrieve( self, key: ArtifactKey, kind: ArtifactKind, destination: Optional[Path] = None, ) -> Union[bytes, Path]: """Retrieve an artifact. For FILE kind: returns bytes. For ARCHIVE kind: unpacks to destination and returns the path. Args: key: Artifact key to retrieve. kind: FILE or ARCHIVE. destination: Target directory for ARCHIVE unpacking. Returns: bytes for FILE kind, Path for ARCHIVE kind. Raises: ArtifactNotFoundError: If artifact does not exist. """ if key.value not in self._storage: raise ArtifactNotFoundError(key=key.value) raw_bytes = self._storage[key.value] if kind == ArtifactKind.FILE: return raw_bytes # ARCHIVE: unpack zip to destination if destination is None: destination = Path(tempfile.mkdtemp(prefix="artifact-")) destination.mkdir(parents=True, exist_ok=True) with zipfile.ZipFile(io.BytesIO(raw_bytes), "r") as zf: zf.extractall(str(destination)) return destination def exists(self, key: ArtifactKey) -> bool: """Check if an artifact exists. Args: key: Artifact key to check. Returns: True if artifact exists, False otherwise. """ return key.value in self._storage def delete(self, key: ArtifactKey) -> bool: """Delete an artifact. Args: key: Artifact key to delete. Returns: True if artifact was deleted, False if not found. """ if key.value in self._storage: del self._storage[key.value] return True return False def generate_key(self, hint: StoreHint, kind: ArtifactKind) -> ArtifactKey: """Generate a deterministic artifact key from hints. Key format: {namespace}/{tag_hash}/{label}.{ext} where tag_hash is a short SHA-256 of sorted tags for uniqueness. Args: hint: Store hints for key generation. kind: FILE or ARCHIVE (affects extension). Returns: Deterministic ArtifactKey. """ tag_str = "|".join( f"{k}={v}" for k, v in sorted(hint.tags.items()) ) tag_hash = hashlib.sha256(tag_str.encode()).hexdigest()[:12] ext = "zip" if kind == ArtifactKind.ARCHIVE else "bin" key_value = f"{hint.namespace}/{tag_hash}/{hint.label}.{ext}" return ArtifactKey(key_value) def _resolve_content( self, kind: ArtifactKind, content: Optional[bytes], file_map: Optional[Dict[str, bytes]], source_directory: Optional[Path], ) -> bytes: """Resolve the raw bytes to store based on kind and inputs. Args: kind: FILE or ARCHIVE. content: Raw bytes for FILE kind. file_map: Dict of relative paths to bytes for ARCHIVE kind. source_directory: Directory to zip for ARCHIVE kind. Returns: Raw bytes to store. Raises: ValueError: If wrong combination of inputs for the given kind. 
""" if kind == ArtifactKind.FILE: if content is None: raise ValueError( "content is required for FILE kind" ) if file_map is not None or source_directory is not None: raise ValueError( "file_map and source_directory must not be provided for FILE kind" ) return content # ARCHIVE kind if content is not None: raise ValueError( "content must not be provided for ARCHIVE kind; " "use file_map or source_directory" ) if file_map is not None and source_directory is not None: raise ValueError( "Provide either file_map or source_directory, not both" ) if file_map is None and source_directory is None: raise ValueError( "Either file_map or source_directory is required for ARCHIVE kind" ) if file_map is not None: return self._zip_file_map(file_map) return self._zip_directory(source_directory) # type: ignore[arg-type] def _zip_file_map(self, file_map: Dict[str, bytes]) -> bytes: """Create a zip archive from a file map. Args: file_map: Mapping of relative paths to content bytes. Returns: Zip archive as bytes. """ buf = io.BytesIO() with zipfile.ZipFile(buf, "w", zipfile.ZIP_DEFLATED) as zf: for rel_path, data in sorted(file_map.items()): zf.writestr(rel_path, data) return buf.getvalue() def _zip_directory(self, directory: Path) -> bytes: """Create a zip archive from a directory. Args: directory: Directory to zip. Returns: Zip archive as bytes. Raises: ValueError: If directory does not exist. """ if not directory.is_dir(): raise ValueError(f"source_directory does not exist: {directory}") buf = io.BytesIO() with zipfile.ZipFile(buf, "w", zipfile.ZIP_DEFLATED) as zf: for file_path in sorted(directory.rglob("*")): if file_path.is_file(): rel_path = file_path.relative_to(directory) zf.writestr(str(rel_path), file_path.read_bytes()) return buf.getvalue() def _validate_content_type(self, content_type: str) -> None: """Validate content type against allowlist. Args: content_type: MIME content type. Raises: ArtifactValidationError: If content type not allowed. """ if content_type not in self._allowed_content_types: raise ArtifactValidationError( f"Content type not allowed: {content_type}. " f"Allowed: {sorted(self._allowed_content_types)}" ) def _validate_size(self, raw_bytes: bytes) -> None: """Validate artifact size against maximum. Args: raw_bytes: Content bytes. Raises: ArtifactValidationError: If content exceeds max size. """ if len(raw_bytes) > self._max_artifact_size_bytes: raise ArtifactValidationError( f"Artifact size {len(raw_bytes)} bytes exceeds maximum " f"{self._max_artifact_size_bytes} bytes" ) ================================================ FILE: build_stream/infra/db/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Database infrastructure package. Provides ORM models, mappers, SQL repository implementations, and session management for PostgreSQL persistence. 
""" from .models import Base, JobModel, StageModel, IdempotencyKeyModel, AuditEventModel, ArtifactMetadata from .mappers import JobMapper, StageMapper, IdempotencyRecordMapper, AuditEventMapper from .repositories import ( SqlJobRepository, SqlStageRepository, SqlIdempotencyRepository, SqlAuditEventRepository, SqlArtifactMetadataRepository, ) from .session import get_db_session, get_db, SessionLocal __all__ = [ "Base", "JobModel", "StageModel", "IdempotencyKeyModel", "AuditEventModel", "ArtifactMetadata", "JobMapper", "StageMapper", "IdempotencyRecordMapper", "AuditEventMapper", "SqlJobRepository", "SqlStageRepository", "SqlIdempotencyRepository", "SqlAuditEventRepository", "SqlArtifactMetadataRepository", "get_db_session", "get_db", "SessionLocal", ] ================================================ FILE: build_stream/infra/db/alembic/env.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Alembic environment configuration.""" import os import sys from logging.config import fileConfig from alembic import context from sqlalchemy import engine_from_config, pool # Add build_stream root to sys.path so models can be imported sys.path.insert(0, os.path.abspath(os.path.join(os.path.dirname(__file__), "..", "..", ".."))) from infra.db.models import Base # noqa: E402 config = context.config # Override sqlalchemy.url from environment variable if available database_url = os.getenv("DATABASE_URL") if database_url: config.set_main_option("sqlalchemy.url", database_url) if config.config_file_name is not None: fileConfig(config.config_file_name) target_metadata = Base.metadata def run_migrations_offline() -> None: """Run migrations in 'offline' mode. Configures the context with just a URL and not an Engine. Calls to context.execute() emit the given string to the script output. """ url = config.get_main_option("sqlalchemy.url") context.configure( url=url, target_metadata=target_metadata, literal_binds=True, dialect_opts={"paramstyle": "named"}, ) with context.begin_transaction(): context.run_migrations() def run_migrations_online() -> None: """Run migrations in 'online' mode. Creates an Engine and associates a connection with the context. 
""" connectable = engine_from_config( config.get_section(config.config_ini_section, {}), prefix="sqlalchemy.", poolclass=pool.NullPool, ) with connectable.connect() as connection: context.configure( connection=connection, target_metadata=target_metadata, ) with context.begin_transaction(): context.run_migrations() if context.is_offline_mode(): run_migrations_offline() else: run_migrations_online() ================================================ FILE: build_stream/infra/db/alembic/script.py.mako ================================================ """${message} Revision ID: ${up_revision} Revises: ${down_revision | comma,n} Create Date: ${create_date} """ from typing import Sequence, Union from alembic import op import sqlalchemy as sa ${imports if imports else ""} # revision identifiers, used by Alembic. revision: str = ${repr(up_revision)} down_revision: Union[str, None] = ${repr(down_revision)} branch_labels: Union[str, Sequence[str], None] = ${repr(branch_labels)} depends_on: Union[str, Sequence[str], None] = ${repr(depends_on)} def upgrade() -> None: ${upgrades if upgrades else "pass"} def downgrade() -> None: ${downgrades if downgrades else "pass"} ================================================ FILE: build_stream/infra/db/alembic/versions/20260219_001_create_jobs_table.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Create jobs table Revision ID: 001 Revises: Create Date: 2026-02-19 """ from typing import Sequence, Union from alembic import op import sqlalchemy as sa # revision identifiers, used by Alembic. 
revision: str = "001" down_revision: Union[str, None] = None branch_labels: Union[str, Sequence[str], None] = None depends_on: Union[str, Sequence[str], None] = None def upgrade() -> None: op.create_table( "jobs", sa.Column("job_id", sa.String(36), primary_key=True, nullable=False), sa.Column("client_id", sa.String(128), nullable=False), sa.Column("request_client_id", sa.String(128), nullable=False), sa.Column("client_name", sa.String(256), nullable=True), sa.Column("job_state", sa.String(20), nullable=False), sa.Column("created_at", sa.DateTime(timezone=True), nullable=False), sa.Column("updated_at", sa.DateTime(timezone=True), nullable=False), sa.Column("version", sa.Integer, nullable=False, server_default="1"), sa.Column("tombstoned", sa.Boolean, nullable=False, server_default="false"), sa.CheckConstraint( "job_state IN ('CREATED', 'IN_PROGRESS', 'COMPLETED', 'FAILED', 'CANCELLED')", name="ck_job_state", ), ) op.create_index("ix_jobs_client_id", "jobs", ["client_id"]) op.create_index("ix_jobs_job_state", "jobs", ["job_state"]) op.create_index("ix_jobs_created_at", "jobs", ["created_at"]) op.create_index("ix_jobs_client_created", "jobs", ["client_id", "created_at"]) def downgrade() -> None: op.drop_index("ix_jobs_client_created", table_name="jobs") op.drop_index("ix_jobs_created_at", table_name="jobs") op.drop_index("ix_jobs_job_state", table_name="jobs") op.drop_index("ix_jobs_client_id", table_name="jobs") op.drop_table("jobs") ================================================ FILE: build_stream/infra/db/alembic/versions/20260219_002_create_stages_table.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Create job_stages table Revision ID: 002 Revises: 001 Create Date: 2026-02-19 """ from typing import Sequence, Union from alembic import op import sqlalchemy as sa # revision identifiers, used by Alembic. 
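# Illustrative way to apply this migration chain programmatically (a sketch;
# the ini path and database URL are hypothetical, and env.py overrides
# sqlalchemy.url from the DATABASE_URL environment variable when it is set):
#   from alembic import command
#   from alembic.config import Config
#   command.upgrade(Config("build_stream/infra/db/alembic.ini"), "head")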
revision: str = "002" down_revision: Union[str, None] = "001" branch_labels: Union[str, Sequence[str], None] = None depends_on: Union[str, Sequence[str], None] = None def upgrade() -> None: op.create_table( "job_stages", sa.Column("job_id", sa.String(36), nullable=False), sa.Column("stage_name", sa.String(50), nullable=False), sa.Column("stage_state", sa.String(20), nullable=False), sa.Column("attempt", sa.Integer, nullable=False, server_default="0"), sa.Column("started_at", sa.DateTime(timezone=True), nullable=True), sa.Column("ended_at", sa.DateTime(timezone=True), nullable=True), sa.Column("error_code", sa.String(50), nullable=True), sa.Column("error_summary", sa.Text, nullable=True), sa.Column("log_file_path", sa.String(512), nullable=True), sa.Column("version", sa.Integer, nullable=False, server_default="1"), sa.PrimaryKeyConstraint("job_id", "stage_name"), sa.ForeignKeyConstraint( ["job_id"], ["jobs.job_id"], ondelete="CASCADE", ), sa.CheckConstraint( "stage_state IN ('PENDING', 'IN_PROGRESS', 'COMPLETED', 'FAILED', 'SKIPPED')", name="ck_stage_state", ), ) op.create_index("ix_stages_job_id", "job_stages", ["job_id"]) op.create_index("ix_stages_stage_state", "job_stages", ["stage_state"]) op.create_index("ix_stages_job_stage", "job_stages", ["job_id", "stage_name"]) def downgrade() -> None: op.drop_index("ix_stages_job_stage", table_name="job_stages") op.drop_index("ix_stages_stage_state", table_name="job_stages") op.drop_index("ix_stages_job_id", table_name="job_stages") op.drop_table("job_stages") ================================================ FILE: build_stream/infra/db/alembic/versions/20260219_003_create_idempotency_keys_table.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Create idempotency_keys table Revision ID: 003 Revises: 002 Create Date: 2026-02-19 """ from typing import Sequence, Union from alembic import op import sqlalchemy as sa # revision identifiers, used by Alembic. 
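# Illustrative expiry sweep that the ix_idempotency_expires_at index created
# below is meant to serve (a sketch; imports, scheduling, and session handling
# are application-specific):
#   session.query(IdempotencyKeyModel).filter(
#       IdempotencyKeyModel.expires_at < datetime.now(timezone.utc)
#   ).delete(synchronize_session=False)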
revision: str = "003" down_revision: Union[str, None] = "002" branch_labels: Union[str, Sequence[str], None] = None depends_on: Union[str, Sequence[str], None] = None def upgrade() -> None: op.create_table( "idempotency_keys", sa.Column("idempotency_key", sa.String(255), primary_key=True, nullable=False), sa.Column("job_id", sa.String(36), nullable=False), sa.Column("request_fingerprint", sa.String(64), nullable=False), sa.Column("client_id", sa.String(128), nullable=False), sa.Column("created_at", sa.DateTime(timezone=True), nullable=False), sa.Column("expires_at", sa.DateTime(timezone=True), nullable=False), ) op.create_index("ix_idempotency_job_id", "idempotency_keys", ["job_id"]) op.create_index("ix_idempotency_client_id", "idempotency_keys", ["client_id"]) op.create_index("ix_idempotency_expires_at", "idempotency_keys", ["expires_at"]) def downgrade() -> None: op.drop_index("ix_idempotency_expires_at", table_name="idempotency_keys") op.drop_index("ix_idempotency_client_id", table_name="idempotency_keys") op.drop_index("ix_idempotency_job_id", table_name="idempotency_keys") op.drop_table("idempotency_keys") ================================================ FILE: build_stream/infra/db/alembic/versions/20260219_004_create_audit_events_table.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Create audit_events table Revision ID: 004 Revises: 003 Create Date: 2026-02-19 """ from typing import Sequence, Union from alembic import op import sqlalchemy as sa from sqlalchemy.dialects.postgresql import JSONB # revision identifiers, used by Alembic. 
revision: str = "004" down_revision: Union[str, None] = "003" branch_labels: Union[str, Sequence[str], None] = None depends_on: Union[str, Sequence[str], None] = None def upgrade() -> None: op.create_table( "audit_events", sa.Column("event_id", sa.String(36), primary_key=True, nullable=False), sa.Column("job_id", sa.String(36), nullable=False), sa.Column("event_type", sa.String(50), nullable=False), sa.Column("correlation_id", sa.String(36), nullable=False), sa.Column("client_id", sa.String(128), nullable=False), sa.Column("timestamp", sa.DateTime(timezone=True), nullable=False), sa.Column("details", JSONB, nullable=True), ) op.create_index("ix_audit_job_id", "audit_events", ["job_id"]) op.create_index("ix_audit_event_type", "audit_events", ["event_type"]) op.create_index("ix_audit_correlation_id", "audit_events", ["correlation_id"]) op.create_index("ix_audit_client_id", "audit_events", ["client_id"]) op.create_index("ix_audit_timestamp", "audit_events", ["timestamp"]) op.create_index("ix_audit_job_timestamp", "audit_events", ["job_id", "timestamp"]) op.create_index( "ix_audit_client_timestamp", "audit_events", ["client_id", "timestamp"], ) def downgrade() -> None: op.drop_index("ix_audit_client_timestamp", table_name="audit_events") op.drop_index("ix_audit_job_timestamp", table_name="audit_events") op.drop_index("ix_audit_timestamp", table_name="audit_events") op.drop_index("ix_audit_client_id", table_name="audit_events") op.drop_index("ix_audit_correlation_id", table_name="audit_events") op.drop_index("ix_audit_event_type", table_name="audit_events") op.drop_index("ix_audit_job_id", table_name="audit_events") op.drop_table("audit_events") ================================================ FILE: build_stream/infra/db/alembic/versions/20260219_005_create_artifact_metadata_table.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Create artifact_metadata table Revision ID: 005 Revises: 004 Create Date: 2026-02-19 13:45:00.000000 """ from typing import Sequence, Union from alembic import op import sqlalchemy as sa # revision identifiers, used by Alembic. 
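# The artifact_ref JSON column is expected to carry the fields of the
# ArtifactRef value object produced by the artifact stores; an illustrative
# (hypothetical) row value:
#   {"key": "jobs/abc123/catalog.bin", "digest": "<sha256>", "size_bytes": 1024,
#    "uri": "file:///var/lib/buildstream/jobs/abc123/catalog.bin"}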
revision: str = '005' down_revision: Union[str, None] = '004' branch_labels: Union[str, Sequence[str], None] = None depends_on: Union[str, Sequence[str], None] = None def upgrade() -> None: # Create artifact_metadata table op.create_table( 'artifact_metadata', sa.Column('id', sa.String(length=36), nullable=False), sa.Column('job_id', sa.String(length=36), nullable=False), sa.Column('stage_name', sa.String(length=50), nullable=False), sa.Column('label', sa.String(length=100), nullable=False), sa.Column('artifact_ref', sa.JSON(), nullable=False), sa.Column('kind', sa.String(length=20), nullable=False), sa.Column('content_type', sa.String(length=100), nullable=False), sa.Column('tags', sa.JSON(), nullable=True), sa.Column('created_at', sa.DateTime(timezone=True), server_default=sa.text('now()'), nullable=False), sa.PrimaryKeyConstraint('id'), sa.ForeignKeyConstraint(['job_id'], ['jobs.job_id'], ondelete='CASCADE'), ) # Create indexes for performance op.create_index('idx_artifact_metadata_job_id', 'artifact_metadata', ['job_id']) op.create_index('idx_artifact_metadata_job_label', 'artifact_metadata', ['job_id', 'label']) def downgrade() -> None: # Drop indexes op.drop_index('idx_artifact_metadata_job_label', table_name='artifact_metadata') op.drop_index('idx_artifact_metadata_job_id', table_name='artifact_metadata') # Drop table op.drop_table('artifact_metadata') ================================================ FILE: build_stream/infra/db/alembic.ini ================================================ [alembic] script_location = %(here)s/alembic sqlalchemy.url = postgresql://%(DB_USER)s:%(DB_PASSWORD)s@%(DB_HOST)s:5432/%(DB_NAME)s [loggers] keys = root,sqlalchemy,alembic [handlers] keys = console [formatters] keys = generic [logger_root] level = WARN handlers = console [logger_sqlalchemy] level = WARN handlers = qualname = sqlalchemy.engine [logger_alembic] level = INFO handlers = qualname = alembic [handler_console] class = StreamHandler args = (sys.stderr,) level = NOTSET formatter = generic [formatter_generic] format = %(levelname)-5.5s [%(name)s] %(message)s datefmt = %H:%M:%S ================================================ FILE: build_stream/infra/db/config.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
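# Illustrative environment (values hypothetical); DatabaseConfig below reads
# these variables when the module is imported:
#   DATABASE_URL=postgresql://user:pass@db:5432/buildstream   (required)
#   DB_POOL_SIZE=20  DB_MAX_OVERFLOW=10  DB_POOL_RECYCLE=3600  DB_ECHO=false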
"""Database configuration module.""" import os from typing import Optional class DatabaseConfig: """Database configuration from environment variables.""" def __init__(self): self.database_url: str = os.getenv("DATABASE_URL", "") self.pool_size: int = int(os.getenv("DB_POOL_SIZE", "20")) self.max_overflow: int = int(os.getenv("DB_MAX_OVERFLOW", "10")) self.pool_recycle: int = int(os.getenv("DB_POOL_RECYCLE", "3600")) self.echo: bool = os.getenv("DB_ECHO", "false").lower() == "true" def validate(self) -> None: """Validate required configuration.""" if not self.database_url: raise ValueError("DATABASE_URL environment variable is required") # Global config instance db_config = DatabaseConfig() ================================================ FILE: build_stream/infra/db/mappers.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Mappers for domain ↔ ORM model conversion. Explicit mapping between domain entities and ORM models. No domain logic lives here — only data transformation. """ from typing import Dict, Any from core.jobs.entities.audit import AuditEvent from core.jobs.entities.idempotency import IdempotencyRecord from core.jobs.entities.job import Job from core.jobs.entities.stage import Stage from core.jobs.value_objects import ( ClientId, CorrelationId, IdempotencyKey, JobId, JobState, RequestFingerprint, StageName, StageState, ) from .models import AuditEventModel, IdempotencyKeyModel, JobModel, StageModel class JobMapper: """Mapper for Job entity ↔ JobModel ORM.""" @staticmethod def to_orm(job: Job) -> JobModel: """Convert Job domain entity to ORM model. Args: job: Job domain entity. Returns: JobModel ORM instance. """ return JobModel( job_id=str(job.job_id), client_id=str(job.client_id), request_client_id=job.request_client_id, client_name=job.client_name, job_state=job.job_state.value, created_at=job.created_at, updated_at=job.updated_at, version=job.version, tombstoned=job.tombstoned, ) @staticmethod def to_domain(model: JobModel) -> Job: """Convert JobModel ORM to Job domain entity. Args: model: JobModel ORM instance. Returns: Job domain entity. """ return Job( job_id=JobId(model.job_id), client_id=ClientId(model.client_id), request_client_id=model.request_client_id, client_name=model.client_name, job_state=JobState(model.job_state), created_at=model.created_at, updated_at=model.updated_at, version=model.version, tombstoned=model.tombstoned, ) class StageMapper: """Mapper for Stage entity ↔ StageModel ORM.""" @staticmethod def to_orm(stage: Stage) -> StageModel: """Convert Stage domain entity to ORM model. Args: stage: Stage domain entity. Returns: StageModel ORM instance. 
""" return StageModel( job_id=str(stage.job_id), stage_name=stage.stage_name.value, stage_state=stage.stage_state.value, attempt=stage.attempt, started_at=stage.started_at, ended_at=stage.ended_at, error_code=stage.error_code, error_summary=stage.error_summary, log_file_path=stage.log_file_path, version=stage.version, ) @staticmethod def to_domain(model: StageModel) -> Stage: """Convert StageModel ORM to Stage domain entity. Args: model: StageModel ORM instance. Returns: Stage domain entity. """ return Stage( job_id=JobId(model.job_id), stage_name=StageName(model.stage_name), stage_state=StageState(model.stage_state), attempt=model.attempt, started_at=model.started_at, ended_at=model.ended_at, error_code=model.error_code, error_summary=model.error_summary, log_file_path=model.log_file_path, version=model.version, ) class IdempotencyRecordMapper: """Mapper for IdempotencyRecord entity ↔ IdempotencyKeyModel ORM.""" @staticmethod def to_orm(record: IdempotencyRecord) -> IdempotencyKeyModel: """Convert IdempotencyRecord domain entity to ORM model. Args: record: IdempotencyRecord domain entity. Returns: IdempotencyKeyModel ORM instance. """ return IdempotencyKeyModel( idempotency_key=str(record.idempotency_key), job_id=str(record.job_id), request_fingerprint=str(record.request_fingerprint), client_id=str(record.client_id), created_at=record.created_at, expires_at=record.expires_at, ) @staticmethod def to_domain(model: IdempotencyKeyModel) -> IdempotencyRecord: """Convert IdempotencyKeyModel ORM to IdempotencyRecord domain entity. Args: model: IdempotencyKeyModel ORM instance. Returns: IdempotencyRecord domain entity. """ return IdempotencyRecord( idempotency_key=IdempotencyKey(model.idempotency_key), job_id=JobId(model.job_id), request_fingerprint=RequestFingerprint(model.request_fingerprint), client_id=ClientId(model.client_id), created_at=model.created_at, expires_at=model.expires_at, ) class AuditEventMapper: """Mapper for AuditEvent entity ↔ AuditEventModel ORM.""" @staticmethod def to_orm(event: AuditEvent) -> AuditEventModel: """Convert AuditEvent domain entity to ORM model. Args: event: AuditEvent domain entity. Returns: AuditEventModel ORM instance. """ return AuditEventModel( event_id=event.event_id, job_id=str(event.job_id), event_type=event.event_type, correlation_id=str(event.correlation_id), client_id=str(event.client_id), timestamp=event.timestamp, details=event.details if event.details else None, ) @staticmethod def to_domain(model: AuditEventModel) -> AuditEvent: """Convert AuditEventModel ORM to AuditEvent domain entity. Args: model: AuditEventModel ORM instance. Returns: AuditEvent domain entity. """ return AuditEvent( event_id=model.event_id, job_id=JobId(model.job_id), event_type=model.event_type, correlation_id=CorrelationId(model.correlation_id), client_id=ClientId(model.client_id), timestamp=model.timestamp, details=model.details if model.details else {}, ) ================================================ FILE: build_stream/infra/db/models.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. 
# You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """SQLAlchemy ORM models for BuildStreaM persistence. ORM models are infrastructure-only and never exposed outside this layer. Domain ↔ ORM conversion is handled by mappers in mappers.py. """ # Third-party imports from sqlalchemy import ( Boolean, Column, DateTime, ForeignKey, Index, Integer, String, Text, func, ) from sqlalchemy.dialects.postgresql import JSONB from sqlalchemy.orm import declarative_base, relationship Base = declarative_base() class JobModel(Base): """ORM model for jobs table. Maps to Job domain entity via JobMapper. """ __tablename__ = "jobs" # Primary key job_id = Column(String(36), primary_key=True, nullable=False) # Business attributes client_id = Column(String(128), nullable=False, index=True) request_client_id = Column(String(128), nullable=False) client_name = Column(String(128), nullable=True) job_state = Column(String(20), nullable=False, index=True) # Timestamps created_at = Column(DateTime(timezone=True), nullable=False, index=True) updated_at = Column(DateTime(timezone=True), nullable=False) # Optimistic locking version = Column(Integer, nullable=False, default=1) # Soft delete tombstoned = Column(Boolean, nullable=False, default=False, index=True) # Relationships stages = relationship( "StageModel", back_populates="job", cascade="all, delete-orphan", lazy="selectin", ) # Composite indexes __table_args__ = ( Index("ix_jobs_client_state", "client_id", "job_state"), Index("ix_jobs_created_tombstoned", "created_at", "tombstoned"), ) class StageModel(Base): """ORM model for job_stages table. Maps to Stage domain entity via StageMapper. Composite primary key: (job_id, stage_name). """ __tablename__ = "job_stages" # Composite primary key job_id = Column( String(36), ForeignKey("jobs.job_id", ondelete="CASCADE"), primary_key=True, nullable=False, ) stage_name = Column(String(30), primary_key=True, nullable=False) # Business attributes stage_state = Column(String(20), nullable=False, index=True) attempt = Column(Integer, nullable=False, default=1) # Timestamps started_at = Column(DateTime(timezone=True), nullable=True) ended_at = Column(DateTime(timezone=True), nullable=True) # Error tracking error_code = Column(String(50), nullable=True) error_summary = Column(Text, nullable=True) # Log file path log_file_path = Column(String(512), nullable=True) # Optimistic locking version = Column(Integer, nullable=False, default=1) # Relationships job = relationship("JobModel", back_populates="stages") # Composite indexes __table_args__ = ( Index("ix_stages_job_state", "job_id", "stage_state"), ) class IdempotencyKeyModel(Base): """ORM model for idempotency_keys table. Maps to IdempotencyRecord domain entity via IdempotencyRecordMapper. 
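
    Example (scratch-schema sketch for local experiments; the in-memory SQLite
    engine is an assumption made here for illustration, while the JSONB-backed
    tables defined below require PostgreSQL):

        from sqlalchemy import create_engine

        engine = create_engine("sqlite:///:memory:")
        Base.metadata.create_all(
            engine,
            tables=[
                JobModel.__table__,
                StageModel.__table__,
                IdempotencyKeyModel.__table__,
            ],
        )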
""" __tablename__ = "idempotency_keys" # Primary key idempotency_key = Column(String(255), primary_key=True, nullable=False) # Business attributes job_id = Column(String(36), nullable=False, index=True) request_fingerprint = Column(String(64), nullable=False) client_id = Column(String(128), nullable=False, index=True) # Timestamps created_at = Column(DateTime(timezone=True), nullable=False, index=True) expires_at = Column(DateTime(timezone=True), nullable=False, index=True) # Composite indexes __table_args__ = ( Index("ix_idempotency_client_created", "client_id", "created_at"), Index("ix_idempotency_expires", "expires_at"), ) class AuditEventModel(Base): """ORM model for audit_events table. Maps to AuditEvent domain entity via AuditEventMapper. """ __tablename__ = "audit_events" # Primary key event_id = Column(String(36), primary_key=True, nullable=False) # Business attributes job_id = Column(String(36), nullable=False, index=True) event_type = Column(String(50), nullable=False, index=True) correlation_id = Column(String(36), nullable=False, index=True) client_id = Column(String(128), nullable=False, index=True) # Timestamp timestamp = Column(DateTime(timezone=True), nullable=False, index=True) # Event details details = Column(JSONB, nullable=True) # Composite indexes __table_args__ = ( Index("ix_audit_job_timestamp", "job_id", "timestamp"), Index("ix_audit_correlation", "correlation_id"), Index("ix_audit_client_timestamp", "client_id", "timestamp"), ) class ArtifactMetadata(Base): """ SQLAlchemy model for artifact metadata storage. Maps to ArtifactRecord domain entity via SqlArtifactMetadataRepository. """ __tablename__ = "artifact_metadata" # Primary key id = Column(String(36), primary_key=True, nullable=False) # Foreign key to jobs table job_id = Column(String(36), ForeignKey("jobs.job_id", ondelete="CASCADE"), nullable=False, index=True) # Business attributes stage_name = Column(String(50), nullable=False) label = Column(String(100), nullable=False) artifact_ref = Column(JSONB, nullable=False) kind = Column(String(20), nullable=False) content_type = Column(String(100), nullable=False) tags = Column(JSONB, nullable=True) # Timestamp created_at = Column(DateTime(timezone=True), server_default=func.now(), nullable=False) # Composite indexes __table_args__ = ( Index("idx_artifact_metadata_job_id", "job_id"), Index("idx_artifact_metadata_job_label", "job_id", "label"), ) ================================================ FILE: build_stream/infra/db/repositories.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """SQL repository implementations for BuildStreaM persistence. These implement the repository Protocol ports defined in core/jobs/repositories.py using SQLAlchemy ORM against PostgreSQL. 
""" from typing import List, Optional from sqlalchemy import select from sqlalchemy.exc import IntegrityError from sqlalchemy.orm import Session from core.jobs.entities.audit import AuditEvent from core.jobs.entities.idempotency import IdempotencyRecord from core.jobs.entities.job import Job from core.jobs.entities.stage import Stage from core.jobs.exceptions import OptimisticLockError from core.jobs.value_objects import IdempotencyKey, JobId, StageName from core.artifacts.ports import ArtifactMetadataRepository from core.artifacts.entities import ArtifactRecord, ArtifactRef, ArtifactKind from core.artifacts.value_objects import ArtifactKey, ArtifactDigest from .mappers import ( AuditEventMapper, IdempotencyRecordMapper, JobMapper, StageMapper, ) from .models import AuditEventModel, IdempotencyKeyModel, JobModel, StageModel class SqlJobRepository: """SQL implementation of JobRepository protocol.""" def __init__(self, session: Session) -> None: """Initialize repository with database session. Args: session: SQLAlchemy session for database operations. """ self.session = session def save(self, job: Job) -> None: """Persist a job aggregate. Uses upsert semantics: inserts if new, updates with optimistic locking if existing. Args: job: Job entity to persist. Raises: OptimisticLockError: If version conflict detected. """ existing = self.session.get(JobModel, str(job.job_id)) if existing: if existing.version != job.version - 1: raise OptimisticLockError( entity_type="Job", entity_id=str(job.job_id), expected_version=job.version - 1, actual_version=existing.version, ) existing.client_id = str(job.client_id) existing.request_client_id = job.request_client_id existing.client_name = job.client_name existing.job_state = job.job_state.value existing.updated_at = job.updated_at existing.version = job.version existing.tombstoned = job.tombstoned else: job_model = JobMapper.to_orm(job) self.session.add(job_model) try: self.session.flush() except IntegrityError as exc: raise OptimisticLockError( entity_type="Job", entity_id=str(job.job_id), expected_version=job.version - 1, actual_version=-1, ) from exc def find_by_id(self, job_id: JobId) -> Optional[Job]: """Retrieve a job by its identifier. Args: job_id: Unique job identifier. Returns: Job entity if found, None otherwise. """ job_model = self.session.get(JobModel, str(job_id)) if job_model is None: return None return JobMapper.to_domain(job_model) def exists(self, job_id: JobId) -> bool: """Check if a job exists. Args: job_id: Unique job identifier. Returns: True if job exists, False otherwise. """ stmt = select(JobModel.job_id).where(JobModel.job_id == str(job_id)) result = self.session.execute(stmt).first() return result is not None class SqlStageRepository: """SQL implementation of StageRepository protocol.""" def __init__(self, session: Session) -> None: """Initialize repository with database session. Args: session: SQLAlchemy session for database operations. """ self.session = session def save(self, stage: Stage) -> None: """Persist a single stage. Uses upsert semantics: inserts if new, updates with optimistic locking if existing. Args: stage: Stage entity to persist. Raises: OptimisticLockError: If version conflict detected. 
""" stmt = select(StageModel).where( StageModel.job_id == str(stage.job_id), StageModel.stage_name == stage.stage_name.value, ) existing = self.session.execute(stmt).scalar_one_or_none() if existing: if existing.version != stage.version - 1: raise OptimisticLockError( entity_type="Stage", entity_id=f"{stage.job_id}/{stage.stage_name.value}", expected_version=stage.version - 1, actual_version=existing.version, ) existing.stage_state = stage.stage_state.value existing.attempt = stage.attempt existing.started_at = stage.started_at existing.ended_at = stage.ended_at existing.error_code = stage.error_code existing.error_summary = stage.error_summary existing.log_file_path = stage.log_file_path existing.version = stage.version else: stage_model = StageMapper.to_orm(stage) self.session.add(stage_model) try: self.session.flush() except IntegrityError as exc: raise OptimisticLockError( entity_type="Stage", entity_id=f"{stage.job_id}/{stage.stage_name}", expected_version=stage.version - 1, actual_version=-1, ) from exc def save_all(self, stages: List[Stage]) -> None: """Persist multiple stages atomically. Args: stages: List of stage entities to persist. Raises: OptimisticLockError: If version conflict detected. """ for stage in stages: self.save(stage) def find_by_job_and_name( self, job_id: JobId, stage_name: StageName, ) -> Optional[Stage]: """Retrieve a stage by job and stage name. Args: job_id: Parent job identifier. stage_name: Stage identifier. Returns: Stage entity if found, None otherwise. """ stmt = select(StageModel).where( StageModel.job_id == str(job_id), StageModel.stage_name == str(stage_name), ) stage_model = self.session.execute(stmt).scalar_one_or_none() if stage_model is None: return None return StageMapper.to_domain(stage_model) def find_all_by_job(self, job_id: JobId) -> List[Stage]: """Retrieve all stages for a job. Args: job_id: Parent job identifier. Returns: List of stage entities (may be empty). """ stmt = ( select(StageModel) .where(StageModel.job_id == str(job_id)) .order_by(StageModel.stage_name) ) stage_models = self.session.execute(stmt).scalars().all() return [StageMapper.to_domain(model) for model in stage_models] class SqlIdempotencyRepository: """SQL implementation of IdempotencyRepository protocol.""" def __init__(self, session: Session) -> None: """Initialize repository with database session. Args: session: SQLAlchemy session for database operations. """ self.session = session def save(self, record: IdempotencyRecord) -> None: """Persist an idempotency record. Args: record: Idempotency record to persist. """ record_model = IdempotencyRecordMapper.to_orm(record) self.session.merge(record_model) self.session.flush() def find_by_key(self, key: IdempotencyKey) -> Optional[IdempotencyRecord]: """Retrieve an idempotency record by key. Args: key: Idempotency key. Returns: IdempotencyRecord if found, None otherwise. """ record_model = self.session.get(IdempotencyKeyModel, str(key)) if record_model is None: return None return IdempotencyRecordMapper.to_domain(record_model) class SqlAuditEventRepository: """SQL implementation of AuditEventRepository protocol.""" def __init__(self, session: Session) -> None: """Initialize repository with database session. Args: session: SQLAlchemy session for database operations. """ self.session = session def save(self, event: AuditEvent) -> None: """Persist an audit event. Args: event: Audit event to persist. 
""" event_model = AuditEventMapper.to_orm(event) self.session.add(event_model) self.session.flush() def find_by_job(self, job_id: JobId) -> List[AuditEvent]: """Retrieve all audit events for a job. Args: job_id: Job identifier. Returns: List of audit events (may be empty). """ stmt = ( select(AuditEventModel) .where(AuditEventModel.job_id == str(job_id)) .order_by(AuditEventModel.timestamp) ) event_models = self.session.execute(stmt).scalars().all() return [AuditEventMapper.to_domain(model) for model in event_models] class SqlArtifactMetadataRepository(ArtifactMetadataRepository): """SQL implementation of artifact metadata repository.""" def __init__(self, session: Session): """Initialize with a SQLAlchemy session.""" self._session = session def save(self, record: ArtifactRecord) -> None: """Save an artifact record to the database.""" from infra.db.models import ArtifactMetadata db_record = ArtifactMetadata( id=record.id, job_id=str(record.job_id), stage_name=record.stage_name.value, label=record.label, artifact_ref={ "key": str(record.artifact_ref.key), "digest": str(record.artifact_ref.digest), "size_bytes": record.artifact_ref.size_bytes, "uri": record.artifact_ref.uri, }, kind=record.kind.value, content_type=record.content_type, tags=record.tags, ) self._session.add(db_record) def get_by_job_id_and_label( self, job_id: JobId, label: str ) -> Optional[ArtifactRecord]: """Get artifact record by job ID and label.""" from infra.db.models import ArtifactMetadata db_record = ( self._session.query(ArtifactMetadata) .filter( ArtifactMetadata.job_id == str(job_id), ArtifactMetadata.label == label, ) .first() ) if not db_record: return None return self._db_record_to_entity(db_record) def find_by_job_stage_and_label( self, job_id: JobId, stage_name: StageName, label: str, ) -> Optional[ArtifactRecord]: """Find an artifact record by job, stage, and label.""" from infra.db.models import ArtifactMetadata db_record = ( self._session.query(ArtifactMetadata) .filter( ArtifactMetadata.job_id == str(job_id), ArtifactMetadata.stage_name == stage_name.value, ArtifactMetadata.label == label, ) .first() ) if not db_record: return None return self._db_record_to_entity(db_record) def list_by_job_id(self, job_id: JobId) -> List[ArtifactRecord]: """List all artifact records for a job.""" from infra.db.models import ArtifactMetadata db_records = ( self._session.query(ArtifactMetadata) .filter(ArtifactMetadata.job_id == str(job_id)) .all() ) return [self._db_record_to_entity(r) for r in db_records] def _db_record_to_entity(self, db_record) -> ArtifactRecord: """Convert database record to domain entity.""" from infra.db.models import ArtifactMetadata artifact_ref_data = db_record.artifact_ref artifact_ref = ArtifactRef( key=ArtifactKey(artifact_ref_data["key"]), digest=ArtifactDigest(artifact_ref_data["digest"]), size_bytes=artifact_ref_data["size_bytes"], uri=artifact_ref_data["uri"], ) return ArtifactRecord( id=db_record.id, job_id=JobId(db_record.job_id), stage_name=StageName(db_record.stage_name), label=db_record.label, artifact_ref=artifact_ref, kind=ArtifactKind(db_record.kind), content_type=db_record.content_type, tags=db_record.tags or {}, ) ================================================ FILE: build_stream/infra/db/session.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. 
# You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Database session management. Engine and session factory are lazily initialized on first use. This allows the module to be imported safely even when DATABASE_URL is not set (e.g. in dev mode with in-memory repositories). """ from contextlib import contextmanager from typing import Generator, Optional from sqlalchemy import create_engine from sqlalchemy.engine import Engine from sqlalchemy.orm import Session, sessionmaker from .config import db_config _engine: Optional[Engine] = None _session_factory: Optional[sessionmaker] = None def _get_engine() -> Engine: """Lazily create and cache the SQLAlchemy engine. Raises: ValueError: If DATABASE_URL is not configured. """ global _engine if _engine is None: db_config.validate() _engine = create_engine( db_config.database_url, pool_size=db_config.pool_size, max_overflow=db_config.max_overflow, pool_recycle=db_config.pool_recycle, echo=db_config.echo, ) return _engine def _get_session_factory() -> sessionmaker: """Lazily create and cache the session factory.""" global _session_factory if _session_factory is None: _session_factory = sessionmaker( autocommit=False, autoflush=False, bind=_get_engine(), ) return _session_factory def SessionLocal() -> Session: """Create a new database session. Returns: A new SQLAlchemy Session instance. Raises: ValueError: If DATABASE_URL is not configured. """ return _get_session_factory()() @contextmanager def get_db_session() -> Generator[Session, None, None]: """ Context manager for database sessions. Usage: with get_db_session() as session: session.add(obj) session.commit() """ session = SessionLocal() try: yield session session.commit() except Exception: session.rollback() raise finally: session.close() def get_db() -> Generator[Session, None, None]: """FastAPI dependency for database sessions.""" db = SessionLocal() try: yield db finally: db.close() ================================================ FILE: build_stream/infra/id_generator.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Infrastructure layer for JobId/UUID generation using UUID v4.""" import uuid from core.jobs.exceptions import JobDomainError from core.jobs.repositories import JobIdGenerator, UUIDGenerator from core.jobs.value_objects import JobId class JobUUIDGenerator(JobIdGenerator): # pylint: disable=R0903 """JobId generator using UUID v4.""" def generate(self) -> JobId: """Generate a new JobId using UUID v4. Returns: JobId: A new job identifier. Raises: JobDomainError: If JobId generation fails. 
""" try: return JobId(str(uuid.uuid4())) except ValueError: raise except Exception as exc: raise JobDomainError(f"Failed to generate JobId: {exc}") from exc class UUIDv4Generator(UUIDGenerator): # pylint: disable=R0903 """UUID v4 generator for general purpose use (returns uuid.UUID).""" def generate(self) -> uuid.UUID: """Generate a new UUID v4. Returns: uuid.UUID: A new UUID v4 instance. """ return uuid.uuid4() ================================================ FILE: build_stream/infra/repositories/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. from infra.repositories.in_memory import ( InMemoryJobRepository, InMemoryStageRepository, InMemoryIdempotencyRepository, InMemoryAuditEventRepository, ) from infra.repositories.nfs_playbook_queue_request_repository import NfsPlaybookQueueRequestRepository from infra.repositories.nfs_playbook_queue_result_repository import NfsPlaybookQueueResultRepository from infra.repositories.nfs_input_repository import NfsInputRepository __all__ = [ "InMemoryJobRepository", "InMemoryStageRepository", "InMemoryIdempotencyRepository", "InMemoryAuditEventRepository", "NfsPlaybookQueueRequestRepository", "NfsPlaybookQueueResultRepository", "NfsInputRepository", ] ================================================ FILE: build_stream/infra/repositories/in_memory.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """ This file contains in-memory implementations of the job repository. 
It is used in testing and development.""" from typing import Dict, List, Optional from core.jobs.entities import Job, Stage, IdempotencyRecord, AuditEvent from core.jobs.value_objects import JobId, IdempotencyKey, StageName class InMemoryJobRepository: """In-memory implementation of Job repository for testing.""" def __init__(self) -> None: """Initialize the repository with empty job storage.""" self._jobs: Dict[str, Job] = {} def save(self, job: Job) -> None: """Save a job to the in-memory storage.""" self._jobs[str(job.job_id)] = job def find_by_id(self, job_id: JobId) -> Optional[Job]: """Find a job by its ID.""" return self._jobs.get(str(job_id)) def exists(self, job_id: JobId) -> bool: """Check if a job exists by its ID.""" return str(job_id) in self._jobs class InMemoryStageRepository: """In-memory implementation of Stage repository for testing.""" def __init__(self) -> None: """Initialize the repository with empty stage storage.""" self._stages: Dict[str, List[Stage]] = {} def save(self, stage: Stage) -> None: """Save a stage to the in-memory storage.""" job_key = str(stage.job_id) if job_key not in self._stages: self._stages[job_key] = [] existing = self.find_by_job_and_name(stage.job_id, stage.stage_name) if existing: stages = self._stages[job_key] self._stages[job_key] = [ s for s in stages if str(s.stage_name) != str(stage.stage_name) ] self._stages[job_key].append(stage) def save_all(self, stages: List[Stage]) -> None: """Save multiple stages to the in-memory storage.""" for stage in stages: self.save(stage) def find_by_job_and_name( self, job_id: JobId, stage_name: StageName ) -> Optional[Stage]: """Find a stage by job ID and stage name.""" job_key = str(job_id) if job_key not in self._stages: return None for stage in self._stages[job_key]: if str(stage.stage_name) == str(stage_name): return stage return None def find_all_by_job(self, job_id: JobId) -> List[Stage]: """Find all stages for a given job ID.""" return self._stages.get(str(job_id), []) class InMemoryIdempotencyRepository: """In-memory implementation of Idempotency repository for testing.""" def __init__(self) -> None: """Initialize the repository with empty idempotency storage.""" self._records: Dict[str, IdempotencyRecord] = {} def save(self, record: IdempotencyRecord) -> None: """Save an idempotency record to the in-memory storage.""" self._records[str(record.idempotency_key)] = record def find_by_key(self, key: IdempotencyKey) -> Optional[IdempotencyRecord]: """Find an idempotency record by its key.""" return self._records.get(str(key)) class InMemoryAuditEventRepository: """In-memory implementation of AuditEvent repository for testing.""" def __init__(self) -> None: """Initialize the repository with empty audit event storage.""" self._events: Dict[str, List[AuditEvent]] = {} def save(self, event: AuditEvent) -> None: """Save an audit event to the in-memory storage.""" job_key = str(event.job_id) if job_key not in self._events: self._events[job_key] = [] self._events[job_key].append(event) def find_by_job(self, job_id: JobId) -> List[AuditEvent]: """Find all audit events for a given job ID.""" return self._events.get(str(job_id), []) ================================================ FILE: build_stream/infra/repositories/nfs_build_image_inventory_repository.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. 
# You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """NFS-based implementation of BuildImageInventoryRepository.""" import logging from pathlib import Path from core.build_image.value_objects import InventoryHost logger = logging.getLogger(__name__) DEFAULT_INVENTORY_DIR = "/opt/omnia/build_stream_inv" DEFAULT_INVENTORY_FILENAME = "inv" class NfsBuildImageInventoryRepository: """NFS shared volume implementation for build image inventory file management. Creates and manages Ansible inventory files for aarch64 builds. """ def __init__( self, inventory_dir: str = DEFAULT_INVENTORY_DIR, inventory_filename: str = DEFAULT_INVENTORY_FILENAME, ) -> None: """Initialize repository with inventory directory path. Args: inventory_dir: Directory path for inventory files. inventory_filename: Name of the inventory file. """ self._inventory_dir = Path(inventory_dir) self._inventory_filename = inventory_filename def create_inventory_file(self, inventory_host: InventoryHost, job_id: str) -> Path: """Create an inventory file for aarch64 builds. Args: inventory_host: The inventory host IP address. job_id: Job identifier for tracking. Returns: Path to the created inventory file. Raises: IOError: If inventory file cannot be created. """ # Ensure inventory directory exists try: self._inventory_dir.mkdir(parents=True, exist_ok=True) except OSError as exc: logger.error("Failed to create inventory directory: %s", self._inventory_dir) raise IOError("Failed to create inventory directory") from None inventory_file_path = self._inventory_dir / self._inventory_filename # Create inventory file content inventory_content = f"[admin_aarch64]\n{str(inventory_host)}\n" try: with open(inventory_file_path, "w", encoding="utf-8") as inv_file: inv_file.write(inventory_content) logger.info( "Created inventory file for job %s at %s with host %s", job_id, inventory_file_path, str(inventory_host), ) return inventory_file_path except OSError as exc: logger.error( "Failed to write inventory file %s for job %s", inventory_file_path, job_id, ) raise IOError("Failed to write inventory file") from None ================================================ FILE: build_stream/infra/repositories/nfs_input_repository.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
"""Consolidated NFS-based implementation for input directory and configuration management.""" import logging import os from pathlib import Path from typing import Optional import yaml from common.config import load_config from core.build_image.repositories import ( BuildStreamConfigRepository, BuildImageInventoryRepository, ) from core.build_image.value_objects import InventoryHost logger = logging.getLogger(__name__) # Load configuration to get base path try: local_config = load_config() DEFAULT_BUILD_STREAM_BASE = Path(local_config.file_store.base_path) except (FileNotFoundError, AttributeError): # Fallback to default path if config is not available DEFAULT_BUILD_STREAM_BASE = Path("/opt/omnia/build_stream_root") DEFAULT_PLAYBOOK_INPUT_DIR = "/opt/omnia/input/project_default/" def _read_project_name(default_file_path: str = "/opt/omnia/input/default.yml") -> str: """Read project_name from default.yml. Args: default_file_path: Path to default.yml file. Returns: Project name (e.g., "project_default"). Returns 'project_default' fallback on any error. """ default_path = Path(default_file_path) if not default_path.exists(): return "project_default" try: with open(default_path, "r", encoding="utf-8") as f: config = yaml.safe_load(f) if not config or "project_name" not in config: return "project_default" return str(config["project_name"]) except yaml.YAMLError: return "project_default" except Exception: return "project_default" class NfsInputRepository(BuildStreamConfigRepository, BuildImageInventoryRepository): """Consolidated NFS repository for input directory and configuration management. This repository combines functionality for: - Input directory path management - Configuration file reading - Inventory file creation Manages paths for input files generated by the GenerateInputFiles API, reads build stream configuration, and creates inventory files for aarch64 builds. """ def __init__( self, config_file_path: Optional[str] = None, default_file_path: str = "/opt/omnia/input/default.yml", playbook_input_dir: str = DEFAULT_PLAYBOOK_INPUT_DIR, build_stream_base: str = DEFAULT_BUILD_STREAM_BASE, inventory_base_dir: str = "/opt/omnia/build_stream_inv", ): """Initialize repository with consolidated paths. Args: config_file_path: Full path to build_stream_config.yml. If None, constructed using project_name from default.yml. default_file_path: Path to default.yml to read project_name. playbook_input_dir: Destination path expected by playbook. build_stream_base: Base path for build stream job data. inventory_base_dir: Base directory for inventory files. """ # Initialize configuration paths if config_file_path is None: project_name = _read_project_name(default_file_path) config_file_path = f"/opt/omnia/input/{project_name}/build_stream_config.yml" self._config_file_path = Path(config_file_path) # Initialize input directory paths self._playbook_input_dir = Path(playbook_input_dir) self._build_stream_base = Path(build_stream_base) # Initialize inventory directory paths self._inventory_base_dir = Path(inventory_base_dir) # === Configuration Methods === def get_aarch64_inv_host(self, job_id: str) -> Optional[InventoryHost]: """Retrieve aarch64 inventory host IP from build_stream_config.yml. Args: job_id: Job identifier. Returns: Inventory host IP address or None if not configured. Raises: ConfigurationError: If config file is invalid or inaccessible. 
""" config_path = self._config_file_path if not config_path.exists(): logger.warning( "build_stream_config.yml not found at %s (job %s)", job_id, config_path, ) return None try: with open(config_path, "r", encoding="utf-8") as f: config = yaml.safe_load(f) if not config: logger.warning("Empty build_stream_config.yml for job %s", job_id) return None inventory_host = config.get("aarch64_inventory_host_ip") if inventory_host: logger.info( "Retrieved inventory_host for job %s: %s", job_id, inventory_host, ) return InventoryHost(str(inventory_host)) logger.info("No aarch64_inventory_host_ip configured for job %s", job_id) return None except yaml.YAMLError as exc: logger.error( "Failed to parse build_stream_config.yml for job %s", job_id, ) return None except Exception as exc: logger.error( "Unexpected error reading build_stream_config.yml for job %s", job_id, ) return None # === Inventory File Methods === def create_inventory_file(self, inventory_host: InventoryHost, job_id: str) -> Path: """Create an inventory file for aarch64 builds. Args: inventory_host: The inventory host IP address. job_id: Job identifier for tracking. Returns: Path to the created inventory file. Raises: IOError: If inventory file cannot be created. """ try: # Create inventory directory if it doesn't exist inventory_dir = self._inventory_base_dir / job_id inventory_dir.mkdir(parents=True, exist_ok=True) # Create inventory file path inventory_file = inventory_dir / "inv" # Create inventory content inventory_content = f"[admin_aarch64]\n{inventory_host.value}\n" # Write inventory file with open(inventory_file, "w", encoding="utf-8") as f: f.write(inventory_content) logger.info( "Created inventory file for job %s at %s with host %s", job_id, inventory_file, inventory_host.value, ) return inventory_file except (OSError, IOError) as exc: logger.error( "Failed to create inventory file for job %s", job_id, ) raise IOError("Cannot create inventory file") from None # === Input Directory Management Methods === def get_source_input_repository_path(self, job_id: str) -> Path: """Get source input directory path for a job. Args: job_id: Job identifier. Returns: Path like /artifacts/{job_id}/input/ """ return self._build_stream_base / job_id / "input" def get_destination_input_repository_path(self) -> Path: """Get destination input directory path expected by playbook. Returns: Path like /opt/omnia/input/project_default/ """ return self._playbook_input_dir def validate_input_directory(self, path: Path) -> bool: """Validate that input directory exists and contains required files. Args: path: Path to the input directory to validate. Returns: True if directory is valid and contains at least one file. """ if not path.is_dir(): logger.warning("Input directory does not exist: %s", path) return False has_files = any(path.iterdir()) if not has_files: logger.warning("Input directory is empty: %s", path) return False return True ================================================ FILE: build_stream/infra/repositories/nfs_playbook_queue_request_repository.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. 
# You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """NFS-based implementation of PlaybookQueueRequestRepository.""" import json import logging import os import stat from pathlib import Path from typing import TYPE_CHECKING if TYPE_CHECKING: from typing import Final from api.logging_utils import log_secure_info from core.localrepo.entities import PlaybookRequest from core.localrepo.exceptions import QueueUnavailableError logger = logging.getLogger(__name__) DEFAULT_QUEUE_BASE = "/opt/omnia/playbook_queue" REQUEST_DIR_NAME = "requests" FILE_PERMISSIONS = stat.S_IRUSR | stat.S_IWUSR # 600 class NfsPlaybookQueueRequestRepository: """NFS shared volume implementation for playbook request queue. Writes playbook request JSON files to the NFS requests directory for consumption by the OIM Core watcher service. """ def __init__(self, queue_base_path: str = DEFAULT_QUEUE_BASE) -> None: """Initialize repository with queue base path. Args: queue_base_path: Base path for the playbook queue on NFS. """ self._queue_base = Path(queue_base_path) self._requests_dir = self._queue_base / REQUEST_DIR_NAME def write_request(self, request: PlaybookRequest) -> Path: """Write a playbook request file to the requests directory. Args: request: Playbook request to write. Returns: Path to the written request file. Raises: QueueUnavailableError: If the queue directory is not accessible. """ if not self.is_available(): raise QueueUnavailableError( queue_path=str(self._requests_dir), reason="Request queue directory does not exist or is not writable", ) filename = request.generate_filename() file_path = self._requests_dir / filename try: request_data = request.to_dict() with open(file_path, "w", encoding="utf-8") as request_file: json.dump(request_data, request_file, indent=2) os.chmod(file_path, FILE_PERMISSIONS) log_secure_info( "info", f"Request file written for job {request.job_id}", str(request.correlation_id), ) return file_path except OSError as exc: log_secure_info( "error", "Failed to write request file", ) raise QueueUnavailableError( queue_path=str(self._requests_dir), reason=f"Failed to write request file: {exc}", ) from exc def is_available(self) -> bool: """Check if the request queue directory is accessible. Returns: True if the queue directory exists and is writable. """ return self._requests_dir.is_dir() and os.access( self._requests_dir, os.W_OK ) def ensure_directories(self) -> None: """Create queue directories if they do not exist.""" self._requests_dir.mkdir(parents=True, exist_ok=True) logger.info("Request queue directory ensured: %s", self._requests_dir) ================================================ FILE: build_stream/infra/repositories/nfs_playbook_queue_result_repository.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. 
# You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """NFS-based implementation of PlaybookQueueResultRepository.""" import json import logging import os import shutil from pathlib import Path from typing import List, Set from api.logging_utils import log_secure_info from core.localrepo.entities import PlaybookResult logger = logging.getLogger(__name__) DEFAULT_QUEUE_BASE = "/opt/omnia/playbook_queue" RESULTS_DIR_NAME = "results" ARCHIVE_DIR_NAME = "archive/results" class NfsPlaybookQueueResultRepository: """NFS shared volume implementation for playbook result queue. Reads playbook result JSON files from the NFS results directory written by the OIM Core watcher service. """ def __init__(self, queue_base_path: str = DEFAULT_QUEUE_BASE) -> None: """Initialize repository with queue base path. Args: queue_base_path: Base path for the playbook queue on NFS. """ self._queue_base = Path(queue_base_path) self._results_dir = self._queue_base / RESULTS_DIR_NAME self._archive_dir = self._queue_base / ARCHIVE_DIR_NAME self._processed_files: Set[str] = set() # Clear cache on startup to ensure we don't miss any files self.clear_processed_cache() logger.info("Initialized NfsPlaybookQueueResultRepository with cleared cache") def get_unprocessed_results(self) -> List[Path]: """Return list of result files not yet processed. Returns: List of paths to unprocessed result JSON files. """ result_files = [] # Check results directory if self._results_dir.is_dir(): for file_path in sorted(self._results_dir.glob("*.json")): if file_path.name not in self._processed_files: result_files.append(file_path) return result_files def read_result(self, result_path: Path) -> PlaybookResult: """Read and parse a result file. Args: result_path: Path to the result JSON file. Returns: Parsed PlaybookResult entity. Raises: ValueError: If the result file is malformed. FileNotFoundError: If the result file does not exist. """ try: with open(result_path, "r", encoding="utf-8") as result_file: data = json.load(result_file) required_fields = {"job_id", "stage_name", "status"} missing = required_fields - set(data.keys()) if missing: raise ValueError( f"Result file {result_path} missing required fields: {missing}" ) return PlaybookResult.from_dict(data) except json.JSONDecodeError as exc: raise ValueError( f"Invalid JSON in result file {result_path}: {exc}" ) from exc def archive_result(self, result_path: Path) -> None: """Move a processed result file to the archive directory. Args: result_path: Path to the result file to archive. """ self._archive_dir.mkdir(parents=True, exist_ok=True) archive_path = self._archive_dir / result_path.name try: # Only move if not already in archive if result_path.parent != self._archive_dir: shutil.move(str(result_path), str(archive_path)) log_secure_info( "info", "Result file moved to archive", ) else: log_secure_info( "info", "Result file already in archive", ) self._processed_files.add(result_path.name) except OSError: # pylint: disable=unused-variable log_secure_info( "error", "Failed to archive result file", ) def is_available(self) -> bool: """Check if the result queue directory is accessible. Returns: True if the queue directory exists and is readable. 
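
        Example (polling sketch; error handling and the downstream job/stage
        update are omitted):

            repo = NfsPlaybookQueueResultRepository()
            if repo.is_available():
                for path in repo.get_unprocessed_results():
                    result = repo.read_result(path)
                    # ... apply the result to the job and stage records ...
                    repo.archive_result(path)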
""" return self._results_dir.is_dir() and os.access( self._results_dir, os.R_OK ) def ensure_directories(self) -> None: """Create queue directories if they do not exist.""" self._results_dir.mkdir(parents=True, exist_ok=True) self._archive_dir.mkdir(parents=True, exist_ok=True) logger.info("Result queue directories ensured: %s", self._results_dir) def clear_processed_cache(self) -> None: """Clear the in-memory set of processed file names.""" self._processed_files.clear() ================================================ FILE: build_stream/main.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Build Stream API Server. Main entry point for the Build Stream API application. This module initializes the FastAPI application and is invoked from the Dockerfile. Usage: uvicorn main:app --host 0.0.0.0 --port $PORT """ import logging import os from contextlib import asynccontextmanager from fastapi import FastAPI, status from fastapi.middleware.cors import CORSMiddleware from fastapi.responses import JSONResponse from api.router import api_router from container import container LOG_LEVEL = os.getenv("LOG_LEVEL", "INFO").upper() logging.basicConfig( level=getattr(logging, LOG_LEVEL, logging.INFO), format="%(asctime)s - %(name)s - %(levelname)s - %(message)s", ) logger = logging.getLogger(__name__) container.wire(modules=[ "api.jobs.routes", "api.jobs.dependencies", "api.local_repo.routes", "api.local_repo.dependencies", "api.validate.routes", "api.validate.dependencies", ]) logger.info("Using container: %s", container.__class__.__name__) @asynccontextmanager async def lifespan(app: FastAPI): """Manage application lifecycle events. Starts the result poller on startup and stops it on shutdown. 
""" # Startup: Start the result poller result_poller = container.result_poller() await result_poller.start() logger.info("Application startup complete") yield # Shutdown: Stop the result poller await result_poller.stop() logger.info("Application shutdown complete") app = FastAPI( title="Build Stream API", description="RESTful API for the Omnia Build Stream application", version="1.0.0", docs_url="/docs", redoc_url="/redoc", openapi_url="/openapi.json", lifespan=lifespan, ) # Attach container to app so dependency_injector Provide dependencies resolve app.container = container app.add_middleware( CORSMiddleware, allow_origins=os.getenv("CORS_ORIGINS", "*").split(","), allow_credentials=True, allow_methods=["*"], allow_headers=["*"], ) app.include_router(api_router) @app.get( "/", summary="Root endpoint", description="Returns a welcome message and API documentation URL.", ) async def root() -> dict: """Root endpoint returning welcome message.""" return { "message": "Welcome to Build Stream API", "docs": "/docs", "version": "1.0.0", } @app.get( "/health", summary="Health check", description="Returns the health status of the API server.", status_code=status.HTTP_200_OK, ) async def health_check() -> dict: """Health check endpoint for container orchestration.""" return {"status": "healthy"} @app.exception_handler(Exception) async def global_exception_handler(request, exc): # pylint: disable=unused-argument """Global exception handler for unhandled exceptions.""" logger.exception("Unhandled exception occurred") return JSONResponse( status_code=status.HTTP_500_INTERNAL_SERVER_ERROR, content={"status": "error", "message": "An internal server error occurred"}, ) def get_server_config(): """Get server host and port configuration with proper validation.""" host = os.getenv("HOST", "0.0.0.0") # Validate host is not empty or just whitespace if not host or host.strip() == "": raise ValueError("HOST environment variable cannot be empty") # Port validation port_env = os.getenv("PORT") if not port_env: raise ValueError("PORT environment variable is required") try: port = int(port_env) if not (1 <= port <= 65535): raise ValueError(f"Port {port} is not in valid range 1-65535") except ValueError as e: if "invalid literal" in str(e): raise ValueError(f"PORT environment variable must be a valid integer, got: {port_env}") raise return host.strip(), port if __name__ == "__main__": import uvicorn try: host, port = get_server_config() logger.info("Starting Build Stream API server on %s:%d", host, port) uvicorn.run("main:app", host=host, port=port) except ValueError as e: raise ValueError("Invalid server configuration") except Exception as e: raise RuntimeError("Internal server error") ================================================ FILE: build_stream/orchestrator/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
================================================ FILE: build_stream/orchestrator/build_image/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Build Image orchestration module.""" from orchestrator.build_image.commands import CreateBuildImageCommand from orchestrator.build_image.dtos import BuildImageResponse from orchestrator.build_image.use_cases import CreateBuildImageUseCase __all__ = [ "CreateBuildImageCommand", "BuildImageResponse", "CreateBuildImageUseCase", ] ================================================ FILE: build_stream/orchestrator/build_image/commands/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Build Image command DTOs.""" from orchestrator.build_image.commands.create_build_image import CreateBuildImageCommand __all__ = ["CreateBuildImageCommand"] ================================================ FILE: build_stream/orchestrator/build_image/commands/create_build_image.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """CreateBuildImage command DTO.""" from dataclasses import dataclass from typing import List, Optional from core.jobs.value_objects import ClientId, CorrelationId, JobId @dataclass(frozen=True) class CreateBuildImageCommand: """Command to trigger build image stage. Immutable command object representing the intent to execute the build-image stage for a given job. Attributes: job_id: Job identifier from URL path. client_id: Client who owns this job (from auth). correlation_id: Request correlation identifier for tracing. architecture: Target architecture (x86_64 or aarch64). image_key: Image identifier key. functional_groups: List of functional groups to build. 
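
    Example (illustrative values; the image key and functional groups are made
    up and the identifiers are random UUIDs):

        command = CreateBuildImageCommand(
            job_id=JobId("c0ffee00-0000-4000-8000-000000000001"),
            client_id=ClientId("client-a"),
            correlation_id=CorrelationId("c0ffee00-0000-4000-8000-000000000002"),
            architecture="x86_64",
            image_key="compute_x86_64",
            functional_groups=["default"],
        )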
""" job_id: JobId client_id: ClientId correlation_id: CorrelationId architecture: str image_key: str functional_groups: List[str] ================================================ FILE: build_stream/orchestrator/build_image/dtos/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Build Image response DTOs.""" from orchestrator.build_image.dtos.build_image_response import BuildImageResponse __all__ = ["BuildImageResponse"] ================================================ FILE: build_stream/orchestrator/build_image/dtos/build_image_response.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Build Image response DTO.""" from dataclasses import dataclass from typing import List @dataclass(frozen=True) class BuildImageResponse: """Response DTO for build image stage acceptance. Attributes: job_id: Job identifier. stage_name: Stage identifier. status: Acceptance status. submitted_at: Submission timestamp (ISO 8601). correlation_id: Correlation identifier. architecture: Target architecture. image_key: Image identifier key. functional_groups: List of functional groups to build. """ job_id: str stage_name: str status: str submitted_at: str correlation_id: str architecture: str image_key: str functional_groups: List[str] ================================================ FILE: build_stream/orchestrator/build_image/use_cases/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
"""Build Image use cases.""" from orchestrator.build_image.use_cases.create_build_image import CreateBuildImageUseCase __all__ = ["CreateBuildImageUseCase"] ================================================ FILE: build_stream/orchestrator/build_image/use_cases/create_build_image.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """CreateBuildImage use case implementation.""" import logging from datetime import datetime, timezone from pathlib import Path from typing import Optional from api.logging_utils import log_secure_info from core.build_image.entities import BuildImageRequest from core.build_image.exceptions import ( InvalidArchitectureError, InvalidImageKeyError, InvalidFunctionalGroupsError, InventoryHostMissingError, ) from core.build_image.repositories import ( BuildStreamConfigRepository, BuildImageInventoryRepository, ) from infra.repositories import NfsInputRepository from core.build_image.services import ( BuildImageConfigService, BuildImageQueueService, ) from core.build_image.value_objects import ( Architecture, ImageKey, FunctionalGroups, InventoryHost, ) from core.localrepo.value_objects import ( ExecutionTimeout, ExtraVars, PlaybookPath, ) from core.jobs.entities import AuditEvent, Stage from core.jobs.exceptions import ( JobNotFoundError, StageNotFoundError, StageAlreadyCompletedError, InvalidStateTransitionError, UpstreamStageNotCompletedError, ) from core.jobs.repositories import ( AuditEventRepository, JobRepository, StageRepository, UUIDGenerator, ) from core.jobs.services import JobStateHelper from core.jobs.value_objects import ( StageName, StageType, StageState, ) from orchestrator.build_image.commands import CreateBuildImageCommand from orchestrator.build_image.dtos import BuildImageResponse logger = logging.getLogger(__name__) PLAYBOOK_PATHS = { "x86_64": "/omnia/build_image_x86_64/build_image_x86_64.yml", "aarch64": "/omnia/build_image_aarch64/build_image_aarch64.yml", } DEFAULT_TIMEOUT_MINUTES = 60 class CreateBuildImageUseCase: """Use case for triggering the build-image stage. This use case orchestrates stage execution with the following guarantees: - Stage guard enforcement: Only PENDING stages can be started - Job ownership verification: Client must own the job - Architecture validation: Only x86_64 and aarch64 supported - Inventory host validation: Required for aarch64 builds - Inventory file creation: Creates inventory file for aarch64 builds - Audit trail: Emits STAGE_STARTED event - NFS queue submission: Submits playbook request to NFS queue for watcher service Attributes: job_repo: Job repository port. stage_repo: Stage repository port. audit_repo: Audit event repository port. config_service: Build image configuration service. queue_service: Build image queue service. inventory_repo: Build image inventory repository. uuid_generator: UUID generator for events and request IDs. 
""" def __init__( self, job_repo: JobRepository, stage_repo: StageRepository, audit_repo: AuditEventRepository, config_service: BuildImageConfigService, queue_service: BuildImageQueueService, inventory_repo: NfsInputRepository, uuid_generator: UUIDGenerator, ) -> None: # pylint: disable=too-many-arguments,too-many-positional-arguments """Initialize use case with repository and service dependencies. Args: job_repo: Job repository implementation. stage_repo: Stage repository implementation. audit_repo: Audit event repository implementation. config_service: Build image configuration service. queue_service: Build image queue service. inventory_repo: Build image inventory repository. uuid_generator: UUID generator for identifiers. """ self._job_repo = job_repo self._stage_repo = stage_repo self._audit_repo = audit_repo self._config_service = config_service self._queue_service = queue_service self._inventory_repo = inventory_repo self._uuid_generator = uuid_generator def execute(self, command: CreateBuildImageCommand) -> BuildImageResponse: """Execute the build-image stage. Args: command: CreateBuildImage command with job details. Returns: BuildImageResponse DTO with acceptance details. Raises: JobNotFoundError: If job does not exist or client mismatch. InvalidStateTransitionError: If stage is not in PENDING state. InvalidArchitectureError: If architecture is not supported. InvalidImageKeyError: If image key format is invalid. InvalidFunctionalGroupsError: If functional groups are invalid. InventoryHostMissingError: If aarch64 requires host but none configured. QueueUnavailableError: If NFS queue is not accessible. """ self._validate_job(command) architecture = self._validate_architecture(command) stage = self._validate_stage(command, architecture) image_key = self._validate_image_key(command) functional_groups = self._validate_functional_groups(command) inventory_host = self._get_inventory_host(command, architecture, stage) # Create inventory file for aarch64 builds inventory_file_path = None if inventory_host: inventory_file_path = self._create_inventory_file( command, inventory_host, stage ) request = self._build_playbook_request( command, architecture, image_key, functional_groups, inventory_file_path, ) self._submit_to_queue(command, request, stage, architecture) self._emit_stage_started_event(command, architecture, image_key) return self._to_response(command, request, architecture, image_key) def _validate_job(self, command: CreateBuildImageCommand): """Validate job exists and belongs to the requesting client.""" job = self._job_repo.find_by_id(command.job_id) if job is None or job.tombstoned: raise JobNotFoundError( job_id=str(command.job_id), correlation_id=str(command.correlation_id), ) if job.client_id != command.client_id: raise JobNotFoundError( job_id=str(command.job_id), correlation_id=str(command.correlation_id), ) return job def _verify_upstream_stage_completed( self, command: CreateBuildImageCommand ) -> None: """Verify that create-local-repository stage is COMPLETED.""" from core.jobs.value_objects import StageState prerequisite_stage = self._stage_repo.find_by_job_and_name( command.job_id, StageName(StageType.CREATE_LOCAL_REPOSITORY.value) ) if ( prerequisite_stage is None or prerequisite_stage.stage_state != StageState.COMPLETED ): raise UpstreamStageNotCompletedError( job_id=str(command.job_id), required_stage="create-local-repository", actual_state=( prerequisite_stage.stage_state.value if prerequisite_stage else "NOT_FOUND" ), correlation_id=str(command.correlation_id), ) 
def _validate_stage(self, command: CreateBuildImageCommand, architecture: Architecture) -> Stage: """Validate stage exists and is in PENDING state.""" # Verify upstream stage is completed self._verify_upstream_stage_completed(command) # Use architecture-specific stage type if architecture.is_x86_64: stage_type = StageType.BUILD_IMAGE_X86_64 else: stage_type = StageType.BUILD_IMAGE_AARCH64 stage_name = StageName(stage_type.value) stage = self._stage_repo.find_by_job_and_name(command.job_id, stage_name) if stage is None: raise StageNotFoundError( job_id=str(command.job_id), stage_name=stage_type.value, correlation_id=str(command.correlation_id), ) # Only allow PENDING stages to transition to IN_PROGRESS if stage.stage_state == StageState.COMPLETED: raise StageAlreadyCompletedError( job_id=str(command.job_id), stage_name=stage_type.value, correlation_id=str(command.correlation_id), ) if stage.stage_state != StageState.PENDING: raise InvalidStateTransitionError( entity_type="Stage", entity_id=f"{command.job_id}/{stage_type.value}", from_state=stage.stage_state.value, to_state="IN_PROGRESS", correlation_id=str(command.correlation_id), ) return stage def _validate_architecture( self, command: CreateBuildImageCommand, ) -> Architecture: """Validate and create Architecture value object.""" try: return Architecture(command.architecture) except ValueError as exc: raise InvalidArchitectureError( message=str(exc), correlation_id=str(command.correlation_id), ) from exc def _validate_image_key(self, command: CreateBuildImageCommand) -> ImageKey: """Validate and create ImageKey value object.""" try: return ImageKey(command.image_key) except ValueError as exc: raise InvalidImageKeyError( message=str(exc), correlation_id=str(command.correlation_id), ) from exc def _validate_functional_groups( self, command: CreateBuildImageCommand, ) -> FunctionalGroups: """Validate and create FunctionalGroups value object.""" try: return FunctionalGroups(command.functional_groups) except ValueError as exc: raise InvalidFunctionalGroupsError( message=str(exc), correlation_id=str(command.correlation_id), ) from exc def _get_inventory_host( self, command: CreateBuildImageCommand, architecture: Architecture, stage: Stage, ): """Get inventory host for aarch64 builds from config service. Inventory host is retrieved internally from build_stream_config.yml and should not be provided in the API request. If inventory host retrieval fails, the stage is transitioned to FAILED and the error is re-raised to prevent playbook invocation. 
""" try: return self._config_service.get_inventory_host( job_id=str(command.job_id), architecture=architecture, correlation_id=str(command.correlation_id), ) except InventoryHostMissingError as exc: try: error_code = "INVENTORY_HOST_MISSING" error_summary = exc.message stage.start() stage.fail( error_code=error_code, error_summary=error_summary, ) self._stage_repo.save(stage) # Update job state to FAILED when stage fails JobStateHelper.handle_stage_failure( job_repo=self._job_repo, audit_repo=self._audit_repo, uuid_generator=self._uuid_generator, job_id=command.job_id, stage_name=str(stage.stage_name), error_code=error_code, error_summary=error_summary, correlation_id=str(command.correlation_id), client_id=str(command.client_id), ) except Exception as save_exc: # If save fails, stage was modified elsewhere log_secure_info( "Stage fail save failed, stage already modified elsewhere: %s", str(save_exc) ) log_secure_info( "error", f"Inventory host missing for job {command.job_id}", str(command.correlation_id), ) raise def _create_inventory_file( self, command: CreateBuildImageCommand, inventory_host: InventoryHost, stage: Stage, ) -> Optional[Path]: """Create inventory file for aarch64 builds. Args: command: CreateBuildImage command. inventory_host: Inventory host IP. stage: Current stage entity. Returns: Path to created inventory file. Raises: IOError: If inventory file creation fails. """ try: inventory_file_path = self._inventory_repo.create_inventory_file( inventory_host=inventory_host, job_id=str(command.job_id), ) logger.info( "Created inventory file for job %s at %s", command.job_id, inventory_file_path, ) return inventory_file_path except IOError as exc: # Refresh stage from database to avoid OptimisticLockError fresh_stage = self._stage_repo.find_by_job_and_name( command.job_id, stage.stage_name ) if fresh_stage: error_code = "INVENTORY_FILE_CREATION_FAILED" error_summary = f"Failed to create inventory file: {str(exc)}" fresh_stage.start() fresh_stage.fail( error_code=error_code, error_summary=error_summary, ) # Update job state to FAILED when stage fails JobStateHelper.handle_stage_failure( job_repo=self._job_repo, audit_repo=self._audit_repo, uuid_generator=self._uuid_generator, job_id=command.job_id, stage_name=str(fresh_stage.stage_name), error_code=error_code, error_summary=error_summary, correlation_id=str(command.correlation_id), client_id=str(command.client_id), ) self._stage_repo.save(fresh_stage) log_secure_info( "error", f"Failed to create inventory file for job {command.job_id}", str(command.correlation_id), ) raise def _build_playbook_request( self, command: CreateBuildImageCommand, architecture: Architecture, image_key: ImageKey, functional_groups: FunctionalGroups, inventory_file_path: Optional[Path], ) -> BuildImageRequest: """Compatibility shim matching historical naming used by execute().""" return self._create_request( command, architecture, image_key, functional_groups, inventory_file_path, ) def _create_request( self, command: CreateBuildImageCommand, architecture: Architecture, image_key: ImageKey, functional_groups: FunctionalGroups, inventory_file_path: Optional[Path], ) -> BuildImageRequest: """Create BuildImageRequest entity.""" # Determine playbook path based on architecture full_path = PLAYBOOK_PATHS[architecture.value] playbook_name = full_path.split("/")[-1] # Extract filename from full path playbook_path = PlaybookPath(playbook_name) # Build extra vars dictionary extra_vars_dict = { "job_id": str(command.job_id), "image_key": str(image_key), 
"functional_groups": functional_groups.to_list(), } extra_vars = ExtraVars(extra_vars_dict) return BuildImageRequest( job_id=str(command.job_id), stage_name="build-image-x86_64" if architecture.is_x86_64 else "build-image-aarch64", playbook_path=playbook_path, extra_vars=extra_vars, inventory_file_path=str(inventory_file_path) if inventory_file_path else None, correlation_id=str(command.correlation_id), timeout=ExecutionTimeout(60), # TODO: Make configurable submitted_at=datetime.now(timezone.utc).isoformat().replace("+00:00", "Z"), request_id=str(self._uuid_generator.generate()), ) def _submit_to_queue( self, command: CreateBuildImageCommand, request: BuildImageRequest, stage: Stage, architecture: Architecture, ) -> None: """Submit playbook request to NFS queue for watcher service.""" stage.start() self._stage_repo.save(stage) self._queue_service.submit_request( request=request, correlation_id=str(command.correlation_id), ) # Use architecture-specific stage type for logging stage_type = StageType.BUILD_IMAGE_X86_64 if architecture.is_x86_64 else StageType.BUILD_IMAGE_AARCH64 logger.info( "Build image request submitted to queue for job %s, stage=%s, " "arch=%s, correlation_id=%s", command.job_id, stage_type.value, str(architecture), command.correlation_id, ) def _emit_stage_started_event( self, command: CreateBuildImageCommand, architecture: Architecture, image_key: ImageKey, ) -> None: """Emit an audit event for stage start.""" # Use architecture-specific stage type for audit event stage_type = StageType.BUILD_IMAGE_X86_64 if architecture.is_x86_64 else StageType.BUILD_IMAGE_AARCH64 event = AuditEvent( event_id=str(self._uuid_generator.generate()), job_id=command.job_id, event_type="STAGE_STARTED", correlation_id=command.correlation_id, client_id=command.client_id, timestamp=datetime.now(timezone.utc), details={ "stage_name": stage_type.value, "architecture": str(architecture), "image_key": str(image_key), }, ) self._audit_repo.save(event) def _to_response( self, command: CreateBuildImageCommand, request: BuildImageRequest, architecture: Architecture, image_key: ImageKey, ) -> BuildImageResponse: """Map to response DTO.""" # Use architecture-specific stage type for response stage_type = StageType.BUILD_IMAGE_X86_64 if architecture.is_x86_64 else StageType.BUILD_IMAGE_AARCH64 return BuildImageResponse( job_id=str(command.job_id), stage_name=stage_type.value, status="accepted", submitted_at=request.submitted_at, correlation_id=str(command.correlation_id), architecture=str(architecture), image_key=str(image_key), functional_groups=command.functional_groups, ) ================================================ FILE: build_stream/orchestrator/catalog/commands/generate_input_files.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
"""GenerateInputFiles command DTO.""" from dataclasses import dataclass from typing import ClassVar, Optional from core.artifacts.value_objects import SafePath from core.jobs.value_objects import CorrelationId, JobId @dataclass(frozen=True) class GenerateInputFilesCommand: """Command to execute the generate-input-files stage. Attributes: job_id: Job identifier (validated UUID). correlation_id: Request correlation identifier for tracing. adapter_policy_path: Optional custom adapter policy path. If None, the default policy is used. """ job_id: JobId correlation_id: CorrelationId adapter_policy_path: Optional[SafePath] = None ================================================ FILE: build_stream/orchestrator/catalog/commands/parse_catalog.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """ParseCatalog command DTO.""" from dataclasses import dataclass from typing import ClassVar from core.jobs.value_objects import CorrelationId, JobId @dataclass(frozen=True) class ParseCatalogCommand: """Command to execute the parse-catalog stage. Attributes: job_id: Job identifier (validated UUID). correlation_id: Request correlation identifier for tracing. filename: Name of the uploaded catalog file. content: Raw bytes of the uploaded catalog file. """ job_id: JobId correlation_id: CorrelationId filename: str content: bytes FILENAME_MAX_LENGTH: ClassVar[int] = 255 MAX_CONTENT_SIZE: ClassVar[int] = 5 * 1024 * 1024 # 5 MB def __post_init__(self) -> None: """Validate command fields.""" if not self.filename or not self.filename.strip(): raise ValueError("filename cannot be empty") if len(self.filename) > self.FILENAME_MAX_LENGTH: raise ValueError( f"filename must be <= {self.FILENAME_MAX_LENGTH} chars, " f"got {len(self.filename)}" ) if not self.content: raise ValueError("content cannot be empty") if len(self.content) > self.MAX_CONTENT_SIZE: raise ValueError( f"content size {len(self.content)} bytes exceeds maximum " f"{self.MAX_CONTENT_SIZE} bytes" ) ================================================ FILE: build_stream/orchestrator/catalog/dtos.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
"""Response DTOs for catalog orchestrator use cases.""" from dataclasses import dataclass, field from typing import List, Tuple from core.artifacts.value_objects import ArtifactRef @dataclass class ParseCatalogResult: """Result DTO for ParseCatalogUseCase.""" job_id: str stage_state: str message: str catalog_ref: ArtifactRef root_jsons_ref: ArtifactRef root_json_count: int arch_os_combinations: List[Tuple[str, str, str]] completed_at: str # ISO 8601 @dataclass class GenerateInputFilesResult: """Result DTO for GenerateInputFilesUseCase.""" job_id: str stage_state: str message: str configs_ref: ArtifactRef = field(metadata={"exclude": True}) # Exclude from JSON response config_file_count: int = field(metadata={"exclude": True}) # Exclude from JSON response config_files: List[str] = field(metadata={"exclude": True}) # Exclude from JSON response arch_os_combinations: List[Tuple[str, str, str]] = field(metadata={"exclude": True}) # Exclude from JSON response completed_at: str = field(metadata={"exclude": True}) # Exclude from JSON response ================================================ FILE: build_stream/orchestrator/catalog/use_cases/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Catalog orchestrator use cases.""" from orchestrator.catalog.use_cases.parse_catalog import ParseCatalogUseCase from orchestrator.catalog.use_cases.generate_input_files import GenerateInputFilesUseCase __all__ = [ "ParseCatalogUseCase", "GenerateInputFilesUseCase", ] ================================================ FILE: build_stream/orchestrator/catalog/use_cases/generate_input_files.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
# pylint: disable=too-many-arguments,too-many-positional-arguments """GenerateInputFiles use case implementation.""" import logging import os import tempfile from datetime import datetime, timezone from pathlib import Path from typing import Dict, List, Tuple from core.artifacts.entities import ArtifactRecord from core.artifacts.exceptions import ArtifactNotFoundError from core.artifacts.ports import ArtifactMetadataRepository, ArtifactStore from core.artifacts.value_objects import ( ArtifactKind, ArtifactRef, SafePath, StoreHint, ) from core.catalog.adapter_policy import generate_configs_from_policy from core.catalog.exceptions import ( AdapterPolicyValidationError, ConfigGenerationError, ) from common.config import load_config from core.jobs.entities import AuditEvent, Job, Stage from core.jobs.exceptions import ( InvalidStateTransitionError, JobNotFoundError, StageAlreadyCompletedError, TerminalStateViolationError, UpstreamStageNotCompletedError, ) from core.jobs.repositories import ( AuditEventRepository, JobRepository, StageRepository, UUIDGenerator, ) from core.jobs.services import JobStateHelper from core.jobs.value_objects import JobId, StageName, StageType, StageState, JobState from orchestrator.catalog.commands.generate_input_files import GenerateInputFilesCommand from orchestrator.catalog.dtos import GenerateInputFilesResult logger = logging.getLogger(__name__) class GenerateInputFilesUseCase: """Use case for executing the generate-input-files stage. Orchestrates: 1. Stage guard validation (parse-catalog COMPLETED, this stage PENDING) 2. Upstream artifact retrieval (root JSONs from parse-catalog) 3. Adapter policy loading and validation 4. Omnia config generation via adapter policy engine 5. Output artifact storage (configs archive) 6. Artifact metadata persistence 7. 
Stage state transitions and audit events """ def __init__( self, job_repo: JobRepository, stage_repo: StageRepository, audit_repo: AuditEventRepository, artifact_store: ArtifactStore, artifact_metadata_repo: ArtifactMetadataRepository, uuid_generator: UUIDGenerator, default_policy_path: SafePath, policy_schema_path: SafePath, ) -> None: self._job_repo = job_repo self._stage_repo = stage_repo self._audit_repo = audit_repo self._artifact_store = artifact_store self._artifact_metadata_repo = artifact_metadata_repo self._uuid_generator = uuid_generator self._default_policy_path = default_policy_path self._policy_schema_path = policy_schema_path self._current_job: Job | None = None def execute( self, command: GenerateInputFilesCommand ) -> GenerateInputFilesResult: """Execute the generate-input-files stage.""" job, stage = self._load_and_guard_stage(command) self._current_job = job self._verify_upstream_stage_completed(command) try: self._mark_stage_started(job, stage, command) with tempfile.TemporaryDirectory( prefix=f"gif-{command.job_id}-" ) as tmp_dir: root_jsons_dir = self._retrieve_upstream_artifacts( command, Path(tmp_dir) ) policy_path = self._resolve_policy_path(command) config_output_dir = self._generate_omnia_configs( root_jsons_dir, policy_path, Path(tmp_dir) ) configs_ref, configs_record = self._store_output_artifacts( command, config_output_dir ) self._copy_configs_to_artifacts_input_dir(command, config_output_dir) self._mark_stage_completed(stage, command) return self._build_success_result( command, configs_ref, configs_record, config_output_dir ) except Exception as e: self._mark_stage_failed(stage, command, e) raise # ------------------------------------------------------------------ # Stage guards # ------------------------------------------------------------------ def _load_and_guard_stage( self, command: GenerateInputFilesCommand ) -> Tuple[Job, Stage]: """Load job and generate-input-files stage, enforce preconditions.""" job = self._job_repo.find_by_id(command.job_id) if job is None: raise JobNotFoundError( job_id=str(command.job_id), correlation_id=str(command.correlation_id), ) if job.job_state.is_terminal(): raise TerminalStateViolationError( entity_type="Job", entity_id=str(command.job_id), state=job.job_state.value, correlation_id=str(command.correlation_id), ) stage = self._stage_repo.find_by_job_and_name( command.job_id, StageName(StageType.GENERATE_INPUT_FILES.value) ) if stage is None: raise JobNotFoundError( job_id=str(command.job_id), correlation_id=str(command.correlation_id), ) if stage.stage_state == StageState.COMPLETED: raise StageAlreadyCompletedError( job_id=str(command.job_id), stage_name="generate-input-files", correlation_id=str(command.correlation_id), ) if stage.stage_state != StageState.PENDING: raise InvalidStateTransitionError( entity_type="Stage", entity_id=f"{command.job_id}/generate-input-files", from_state=stage.stage_state.value, to_state="IN_PROGRESS", correlation_id=str(command.correlation_id), ) return job, stage def _verify_upstream_stage_completed( self, command: GenerateInputFilesCommand ) -> None: """Verify that parse-catalog stage is COMPLETED.""" parse_stage = self._stage_repo.find_by_job_and_name( command.job_id, StageName(StageType.PARSE_CATALOG.value) ) if ( parse_stage is None or parse_stage.stage_state != StageState.COMPLETED ): raise UpstreamStageNotCompletedError( job_id=str(command.job_id), required_stage="parse-catalog", actual_state=( parse_stage.stage_state.value if parse_stage else "NOT_FOUND" ), 
correlation_id=str(command.correlation_id), ) # ------------------------------------------------------------------ # Artifact retrieval # ------------------------------------------------------------------ def _retrieve_upstream_artifacts( self, command: GenerateInputFilesCommand, tmp_base: Path ) -> Path: """Retrieve root JSONs archive from ArtifactStore and unpack.""" record = self._artifact_metadata_repo.find_by_job_stage_and_label( job_id=command.job_id, stage_name=StageName(StageType.PARSE_CATALOG.value), label="root-jsons", ) if record is None: raise ArtifactNotFoundError( key=f"root-jsons for job {command.job_id}", correlation_id=str(command.correlation_id), ) destination = tmp_base / "root-jsons" return self._artifact_store.retrieve( key=record.artifact_ref.key, kind=ArtifactKind.ARCHIVE, destination=destination, ) # ------------------------------------------------------------------ # Config generation # ------------------------------------------------------------------ def _resolve_policy_path( self, command: GenerateInputFilesCommand ) -> str: """Resolve the adapter policy path.""" if command.adapter_policy_path is not None: policy_path = str(command.adapter_policy_path.value) else: policy_path = str(self._default_policy_path.value) if not os.path.isfile(policy_path): raise FileNotFoundError(f"Adapter policy not found: {policy_path}") return policy_path def _generate_omnia_configs( self, root_jsons_dir: Path, policy_path: str, tmp_base: Path, ) -> Path: """Generate Omnia config files using the adapter policy engine.""" output_dir = tmp_base / "omnia-configs" output_dir.mkdir(parents=True, exist_ok=True) try: generate_configs_from_policy( input_dir=str(root_jsons_dir), output_dir=str(output_dir), policy_path=policy_path, schema_path=str(self._policy_schema_path.value), ) except ValueError as e: raise AdapterPolicyValidationError(str(e)) from e except FileNotFoundError: raise except Exception as e: raise ConfigGenerationError( f"Config generation failed: {e}" ) from e # Check if any files were generated has_files = any( filename.endswith(".json") for root, _dirs, files in os.walk(str(output_dir)) for filename in files ) if not has_files: raise ConfigGenerationError( "No config files generated. Check adapter policy and root JSONs." 
) return output_dir # ------------------------------------------------------------------ # Artifact storage # ------------------------------------------------------------------ def _store_output_artifacts( self, command: GenerateInputFilesCommand, config_output_dir: Path, ) -> Tuple[ArtifactRef, ArtifactRecord]: """Store generated configs as archive artifact and persist metadata.""" # Check if artifact already exists (idempotency handling) existing_record = self._artifact_metadata_repo.find_by_job_stage_and_label( job_id=command.job_id, stage_name=StageName(StageType.GENERATE_INPUT_FILES.value), label="omnia-configs", ) if existing_record is not None: logger.info( "Artifact already exists for job %s, returning existing record: %s", command.job_id, existing_record.artifact_ref.key.value, ) return existing_record.artifact_ref, existing_record hint = StoreHint( namespace="input-files", label="omnia-configs", tags={"job_id": str(command.job_id)}, ) configs_ref = self._artifact_store.store( hint=hint, kind=ArtifactKind.ARCHIVE, source_directory=config_output_dir, content_type="application/zip", ) record = ArtifactRecord( id=str(self._uuid_generator.generate()), job_id=command.job_id, stage_name=StageName(StageType.GENERATE_INPUT_FILES.value), label="omnia-configs", artifact_ref=configs_ref, kind=ArtifactKind.ARCHIVE, content_type="application/zip", tags={ "job_id": str(command.job_id), }, ) self._artifact_metadata_repo.save(record) return configs_ref, record def _copy_configs_to_artifacts_input_dir( self, command: GenerateInputFilesCommand, config_output_dir: Path, ) -> None: """Copy generated config files to artifacts/{job_id}/ directory. This creates a copy of the generated input files in the expected location for the NfsInputDirectoryRepository to consume. Args: command: Generate input files command. config_output_dir: Directory containing generated config files. 
""" import shutil # Load config and get artifacts base path from configuration config = load_config() artifacts_base = Path(config.file_store.base_path) target_dir = artifacts_base / str(command.job_id) # Create target directory if it doesn't exist target_dir.mkdir(parents=True, exist_ok=True) # Copy all contents from config_output_dir to target_dir for item in config_output_dir.iterdir(): if item.is_file(): shutil.copy2(item, target_dir / item.name) elif item.is_dir(): shutil.copytree(item, target_dir / item.name, dirs_exist_ok=True) logger.info( "Copied generated configs to artifacts input directory: %s", target_dir ) # ------------------------------------------------------------------ # State transitions # ------------------------------------------------------------------ def _mark_stage_started( self, job: Job, stage: Stage, command: GenerateInputFilesCommand ) -> None: """Transition stage to IN_PROGRESS.""" stage.start() self._stage_repo.save(stage) self._emit_audit_event( command, "STAGE_STARTED", {"stage_name": "generate-input-files"}, ) def _mark_stage_completed( self, stage: Stage, command: GenerateInputFilesCommand ) -> None: """Transition stage to COMPLETED.""" stage.complete() self._stage_repo.save(stage) self._emit_audit_event( command, "STAGE_COMPLETED", {"stage_name": "generate-input-files"}, ) def _mark_stage_failed( self, stage: Stage, command: GenerateInputFilesCommand, error: Exception ) -> None: """Transition stage to FAILED with error details.""" error_code = type(error).__name__ error_summary = "Processing failed" stage.fail(error_code=error_code, error_summary=error_summary) self._stage_repo.save(stage) self._emit_audit_event( command, "STAGE_FAILED", { "stage_name": "generate-input-files", "error_code": error_code, "error_summary": error_summary, }, ) # Update job state to FAILED when stage fails JobStateHelper.handle_stage_failure( job_repo=self._job_repo, audit_repo=self._audit_repo, uuid_generator=self._uuid_generator, job_id=command.job_id, stage_name="generate-input-files", error_code=error_code, error_summary=error_summary, correlation_id=str(command.correlation_id), client_id=str(command.client_id), ) # ------------------------------------------------------------------ # Audit # ------------------------------------------------------------------ def _emit_audit_event( self, command: GenerateInputFilesCommand, event_type: str, details: dict, ) -> None: """Emit an audit event.""" from core.jobs.value_objects import ClientId client_id = ( self._current_job.client_id if self._current_job is not None else ClientId("unknown") ) event = AuditEvent( event_id=str(self._uuid_generator.generate()), job_id=command.job_id, event_type=event_type, correlation_id=command.correlation_id, client_id=client_id, timestamp=datetime.now(timezone.utc), details=details, ) self._audit_repo.save(event) # ------------------------------------------------------------------ # Result building # ------------------------------------------------------------------ def _build_success_result( self, command: GenerateInputFilesCommand, configs_ref: ArtifactRef, configs_record: ArtifactRecord, config_output_dir: Path, ) -> GenerateInputFilesResult: """Build minimal success result with only essential fields.""" return GenerateInputFilesResult( job_id=str(command.job_id), stage_state="COMPLETED", message="Input files generated successfully", configs_ref=configs_ref, config_file_count=0, # Not included in minimal response config_files=[], # Not included in minimal response arch_os_combinations=[], # Not 
included in minimal response completed_at="", # Not included in minimal response ) ================================================ FILE: build_stream/orchestrator/catalog/use_cases/parse_catalog.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. # pylint: disable=too-many-arguments,too-many-positional-arguments """ParseCatalog use case implementation.""" import json import logging import tempfile from datetime import datetime, timezone from pathlib import Path from typing import Dict, Tuple import hashlib from jsonschema import ValidationError from core.artifacts.entities import ArtifactRecord from core.artifacts.exceptions import ArtifactAlreadyExistsError from core.artifacts.interfaces import ArtifactMetadataRepository, ArtifactStore from core.artifacts.value_objects import ArtifactDigest, ArtifactKind, ArtifactRef, StoreHint from core.catalog.exceptions import ( CatalogSchemaValidationError, InvalidFileFormatError, InvalidJSONError, ) from core.catalog.generator import generate_root_json_from_catalog from core.jobs.entities import AuditEvent, Job, Stage from core.jobs.exceptions import ( InvalidStateTransitionError, JobNotFoundError, StageAlreadyCompletedError, TerminalStateViolationError, ) from core.jobs.repositories import ( AuditEventRepository, JobRepository, StageRepository, UUIDGenerator, ) from core.jobs.services import JobStateHelper from core.jobs.value_objects import ( ClientId, StageName, StageState, StageType, JobState, ) from orchestrator.catalog.commands.parse_catalog import ParseCatalogCommand from orchestrator.catalog.dtos import ParseCatalogResult logger = logging.getLogger(__name__) class ParseCatalogUseCase: # pylint: disable=too-few-public-methods """Use case for executing the parse-catalog stage. Orchestrates: 1. Stage guard validation (job exists, stage PENDING) 2. Catalog validation (format, JSON, schema) 3. Root JSON generation via existing generator 4. Artifact storage (catalog file + root JSONs archive) 5. Artifact metadata persistence 6. Stage state transitions and audit events """ def __init__( self, job_repo: JobRepository, stage_repo: StageRepository, audit_repo: AuditEventRepository, artifact_store: ArtifactStore, artifact_metadata_repo: ArtifactMetadataRepository, uuid_generator: UUIDGenerator, ) -> None: self._job_repo = job_repo self._stage_repo = stage_repo self._audit_repo = audit_repo self._artifact_store = artifact_store self._artifact_metadata_repo = artifact_metadata_repo self._uuid_generator = uuid_generator self._current_job: Job | None = None def execute(self, command: ParseCatalogCommand) -> ParseCatalogResult: """Execute the parse-catalog stage. Args: command: ParseCatalogCommand with job_id, filename, content. Returns: ParseCatalogResult with stage outcome and artifact references. Raises: JobNotFoundError: If job does not exist. InvalidStateTransitionError: If job/stage not in valid state. 
StageAlreadyCompletedError: If stage already completed. InvalidFileFormatError: If file is not JSON. InvalidJSONError: If content is not valid JSON dict. CatalogSchemaValidationError: If catalog fails schema validation. ArtifactStoreError: If artifact storage fails. """ job, stage = self._load_and_guard_stage(command) self._current_job = job # Idempotency: if stage already completed, return existing result existing = self._check_idempotent_completion(command, stage) if existing is not None: return existing try: self._mark_stage_started(job, stage, command) self._validate_file_format(command.filename) catalog_data = self._parse_and_validate_json(command.content) catalog_ref = self._store_catalog_artifact(command) root_jsons_ref = self._generate_and_store_root_jsons( command, catalog_data ) self._mark_stage_completed(stage, command) return self._build_success_result( command, catalog_ref, root_jsons_ref ) except Exception as e: self._mark_stage_failed(stage, command, e) raise # ------------------------------------------------------------------ # Stage guards # ------------------------------------------------------------------ def _load_and_guard_stage( self, command: ParseCatalogCommand ) -> Tuple[Job, Stage]: """Load job and parse-catalog stage, enforce preconditions.""" job = self._job_repo.find_by_id(command.job_id) if job is None: raise JobNotFoundError( job_id=str(command.job_id), correlation_id=str(command.correlation_id), ) if job.job_state.is_terminal(): raise TerminalStateViolationError( entity_type="Job", entity_id=str(command.job_id), state=job.job_state.value, correlation_id=str(command.correlation_id), ) stage = self._stage_repo.find_by_job_and_name( command.job_id, StageName(StageType.PARSE_CATALOG.value) ) if stage is None: raise JobNotFoundError( job_id=str(command.job_id), correlation_id=str(command.correlation_id), ) if stage.stage_state == StageState.COMPLETED: raise StageAlreadyCompletedError( job_id=str(command.job_id), stage_name="parse-catalog", correlation_id=str(command.correlation_id), ) if stage.stage_state != StageState.PENDING: raise InvalidStateTransitionError( entity_type="Stage", entity_id=f"{command.job_id}/parse-catalog", from_state=stage.stage_state.value, to_state="IN_PROGRESS", correlation_id=str(command.correlation_id), ) return job, stage def _check_idempotent_completion( self, command: ParseCatalogCommand, stage: Stage ) -> ParseCatalogResult | None: """If stage already completed with artifacts, return existing result.""" # Stage guard already rejects COMPLETED, so this is only for # future use if we relax the guard for idempotent retries. return None # ------------------------------------------------------------------ # Validation # ------------------------------------------------------------------ def _validate_file_format(self, filename: str) -> None: """Validate that the file has a .json extension.""" if not filename.lower().endswith(".json"): raise InvalidFileFormatError( "Invalid file format. Only JSON files are accepted." ) def _parse_and_validate_json(self, content: bytes) -> dict: """Parse JSON content from bytes and validate structure.""" try: data = json.loads(content.decode("utf-8")) except json.JSONDecodeError as e: raise InvalidJSONError(f"Invalid JSON data: {e.msg}") from e except UnicodeDecodeError as e: raise InvalidJSONError("File content is not valid UTF-8 text") from e if not isinstance(data, dict): raise InvalidJSONError( "Invalid JSON data. The data must be a dictionary." 
) return data # ------------------------------------------------------------------ # Artifact storage # ------------------------------------------------------------------ def _store_catalog_artifact( self, command: ParseCatalogCommand ) -> ArtifactRef: """Store the uploaded catalog file as a FILE artifact.""" hint = StoreHint( namespace="catalog", label="catalog-file", tags={"job_id": str(command.job_id)}, ) try: catalog_ref = self._artifact_store.store( hint=hint, kind=ArtifactKind.FILE, content=command.content, content_type="application/json", ) except ArtifactAlreadyExistsError: # Idempotent: artifact already stored from a previous attempt key = self._artifact_store.generate_key(hint, ArtifactKind.FILE) raw = self._artifact_store.retrieve(key, ArtifactKind.FILE) digest = ArtifactDigest(hashlib.sha256(raw).hexdigest()) catalog_ref = ArtifactRef( key=key, digest=digest, size_bytes=len(raw), uri=f"memory://{key.value}", ) record = ArtifactRecord( id=str(self._uuid_generator.generate()), job_id=command.job_id, stage_name=StageName(StageType.PARSE_CATALOG.value), label="catalog-file", artifact_ref=catalog_ref, kind=ArtifactKind.FILE, content_type="application/json", tags={"job_id": str(command.job_id)}, ) self._artifact_metadata_repo.save(record) return catalog_ref def _generate_and_store_root_jsons( self, command: ParseCatalogCommand, catalog_data: dict, ) -> Tuple[ArtifactRef, Dict[str, bytes]]: """Generate root JSONs and store as ARCHIVE artifact.""" with tempfile.TemporaryDirectory( prefix=f"parse-catalog-{command.job_id}-" ) as tmp_dir: tmp_path = Path(tmp_dir) catalog_file = tmp_path / "catalog.json" catalog_file.write_text( json.dumps(catalog_data), encoding="utf-8" ) output_dir = tmp_path / "root_jsons" output_dir.mkdir() try: generate_root_json_from_catalog( catalog_path=str(catalog_file), output_root=str(output_dir), ) except ValidationError as e: # Preserve the original validation error message error_msg = f"Catalog schema validation failed: {e.message}" if e.absolute_path: error_msg += f" at {'/'.join(str(p) for p in e.absolute_path)}" raise CatalogSchemaValidationError(error_msg) from e except Exception as e: raise CatalogSchemaValidationError( f"Catalog processing failed: {e}" ) from e hint = StoreHint( namespace="catalog", label="root-jsons", tags={"job_id": str(command.job_id)}, ) try: root_jsons_ref = self._artifact_store.store( hint=hint, kind=ArtifactKind.ARCHIVE, source_directory=output_dir, content_type="application/zip", ) except ArtifactAlreadyExistsError: key = self._artifact_store.generate_key(hint, ArtifactKind.ARCHIVE) raw = self._artifact_store.retrieve(key, ArtifactKind.FILE) digest = ArtifactDigest(hashlib.sha256(raw).hexdigest()) root_jsons_ref = ArtifactRef( key=key, digest=digest, size_bytes=len(raw), uri=f"memory://{key.value}", ) record = ArtifactRecord( id=str(self._uuid_generator.generate()), job_id=command.job_id, stage_name=StageName(StageType.PARSE_CATALOG.value), label="root-jsons", artifact_ref=root_jsons_ref, kind=ArtifactKind.ARCHIVE, content_type="application/zip", tags={ "job_id": str(command.job_id), }, ) self._artifact_metadata_repo.save(record) return root_jsons_ref # ------------------------------------------------------------------ # State transitions # ------------------------------------------------------------------ def _mark_stage_started( self, job: Job, stage: Stage, command: ParseCatalogCommand ) -> None: """Transition stage to IN_PROGRESS and job to IN_PROGRESS if needed.""" stage.start() self._stage_repo.save(stage) if job.job_state 
== JobState.CREATED: job.start() self._job_repo.save(job) self._emit_audit_event( command, "STAGE_STARTED", {"stage_name": "parse-catalog"} ) def _mark_stage_completed( self, stage: Stage, command: ParseCatalogCommand ) -> None: """Transition stage to COMPLETED.""" stage.complete() self._stage_repo.save(stage) self._emit_audit_event( command, "STAGE_COMPLETED", {"stage_name": "parse-catalog"} ) def _mark_stage_failed( self, stage: Stage, command: ParseCatalogCommand, error: Exception ) -> None: """Transition stage to FAILED with error details.""" error_code = type(error).__name__ error_summary = "Processing failed" stage.fail(error_code=error_code, error_summary=error_summary) self._stage_repo.save(stage) self._emit_audit_event( command, "STAGE_FAILED", { "stage_name": "parse-catalog", "error_code": error_code, "error_summary": error_summary, }, ) # Update job state to FAILED when stage fails JobStateHelper.handle_stage_failure( job_repo=self._job_repo, audit_repo=self._audit_repo, uuid_generator=self._uuid_generator, job_id=command.job_id, stage_name="parse-catalog", error_code=error_code, error_summary=error_summary, correlation_id=str(command.correlation_id), client_id=str(command.client_id), ) # ------------------------------------------------------------------ # Audit # ------------------------------------------------------------------ def _emit_audit_event( self, command: ParseCatalogCommand, event_type: str, details: dict, ) -> None: """Emit an audit event.""" client_id = ( self._current_job.client_id if self._current_job is not None else ClientId("unknown") ) event = AuditEvent( event_id=str(self._uuid_generator.generate()), job_id=command.job_id, event_type=event_type, correlation_id=command.correlation_id, client_id=client_id, timestamp=datetime.now(timezone.utc), details=details, ) self._audit_repo.save(event) # ------------------------------------------------------------------ # Result building # ------------------------------------------------------------------ def _build_success_result( self, command: ParseCatalogCommand, catalog_ref: ArtifactRef, root_jsons_ref: ArtifactRef, ) -> ParseCatalogResult: """Build the success result DTO.""" return ParseCatalogResult( job_id=str(command.job_id), stage_state="COMPLETED", message="Catalog parsed successfully", catalog_ref=catalog_ref, root_jsons_ref=root_jsons_ref, root_json_count=0, # No longer tracking file count arch_os_combinations=[], # No longer tracking combinations completed_at=datetime.now(timezone.utc).isoformat(), ) ================================================ FILE: build_stream/orchestrator/common/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
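# Hedged wiring sketch (the constructed dependency names are placeholders):
# ResultPoller, re-exported below, runs as an asyncio background task, so the
# application startup/shutdown hooks would typically bracket it like this:
#
#     poller = ResultPoller(result_service, job_repo, stage_repo,
#                           audit_repo, uuid_generator, poll_interval=5)
#     await poller.start()   # spawns the polling loop as an asyncio task
#     ...
#     await poller.stop()    # cancels the loop and awaits its shutdown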
"""Common orchestrator components shared across stages.""" from orchestrator.common.result_poller import ResultPoller __all__ = ["ResultPoller"] ================================================ FILE: build_stream/orchestrator/common/result_poller.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Common result poller for processing playbook execution results from NFS queue. This module provides a shared ResultPoller that can be used by all stage APIs (local_repo, build_image, validate_image_on_test, etc.) to poll the NFS result queue and update stage states accordingly. """ import asyncio import logging from datetime import datetime, timezone from api.logging_utils import log_secure_info from core.jobs.entities import AuditEvent from core.jobs.entities.stage import StageState from core.jobs.repositories import ( AuditEventRepository, JobRepository, StageRepository, UUIDGenerator, ) from core.jobs.services import JobStateHelper from core.jobs.value_objects import JobId, StageName from core.localrepo.entities import PlaybookResult from core.localrepo.services import PlaybookQueueResultService logger = logging.getLogger(__name__) class ResultPoller: """Common poller for processing playbook execution results. This poller monitors the NFS result queue and processes results by updating stage states and emitting audit events. It handles results from all stage types (local_repo, build_image, validate_image_on_test, etc.). Attributes: result_service: Service for polling NFS result queue. job_repo: Job repository for updating job states. stage_repo: Stage repository for updating stage states. audit_repo: Audit event repository for emitting events. uuid_generator: UUID generator for event IDs. poll_interval: Interval in seconds between polls. running: Flag indicating if poller is running. """ def __init__( self, result_service: PlaybookQueueResultService, job_repo: JobRepository, stage_repo: StageRepository, audit_repo: AuditEventRepository, uuid_generator: UUIDGenerator, poll_interval: int = 5, ) -> None: # pylint: disable=too-many-arguments,too-many-positional-arguments """Initialize result poller. Args: result_service: Service for polling NFS result queue. job_repo: Job repository implementation. stage_repo: Stage repository implementation. audit_repo: Audit event repository implementation. uuid_generator: UUID generator for identifiers. poll_interval: Interval in seconds between polls (default: 5). 
""" self._result_service = result_service self._job_repo = job_repo self._stage_repo = stage_repo self._audit_repo = audit_repo self._uuid_generator = uuid_generator self._poll_interval = poll_interval self._running = False self._task = None async def start(self) -> None: """Start the result poller.""" if self._running: logger.warning("Result poller is already running") return self._running = True self._task = asyncio.create_task(self._poll_loop()) logger.info("Result poller started with interval=%ds", self._poll_interval) async def stop(self) -> None: """Stop the result poller.""" if not self._running: return self._running = False if self._task: self._task.cancel() try: await self._task except asyncio.CancelledError: pass logger.info("Result poller stopped") async def _poll_loop(self) -> None: """Main polling loop.""" while self._running: try: processed_count = self._result_service.poll_results( callback=self._on_result_received ) if processed_count > 0: logger.info("Processed %d playbook results", processed_count) except Exception as exc: # pylint: disable=broad-except logger.exception("Error polling results: %s", exc) await asyncio.sleep(self._poll_interval) def _on_result_received(self, result: PlaybookResult) -> None: """Handle received playbook result. Args: result: Playbook execution result from NFS queue. """ try: # Find stage stage_name = StageName(result.stage_name) stage = self._stage_repo.find_by_job_and_name(result.job_id, stage_name) if stage is None: logger.error( "Stage not found for result: job_id=%s, stage=%s", result.job_id, result.stage_name, ) return # Update stage based on result # Check if stage is already in terminal state (e.g., after service restart) if stage.stage_state in {StageState.COMPLETED, StageState.FAILED, StageState.CANCELLED}: logger.info( "Stage already in terminal state: job_id=%s, stage=%s, state=%s", result.job_id, result.stage_name, stage.stage_state, ) # Return early - service will archive the result file automatically return if result.status == "success": stage.complete() logger.info( "Stage completed: job_id=%s, stage=%s", result.job_id, result.stage_name, ) # Check if this is the final stage (validate-image-on-test) # If so, mark the job as completed if result.stage_name == "validate-image-on-test": JobStateHelper.handle_job_completion( job_repo=self._job_repo, audit_repo=self._audit_repo, uuid_generator=self._uuid_generator, job_id=JobId(result.job_id), correlation_id=result.request_id.value if hasattr(result.request_id, 'value') else str(result.request_id), client_id=str(result.job_id), ) else: error_code = result.error_code or "PLAYBOOK_FAILED" error_summary = result.error_summary or "Playbook execution failed" stage.fail(error_code=error_code, error_summary=error_summary) logger.warning( "Stage failed: job_id=%s, stage=%s, error=%s", result.job_id, result.stage_name, error_code, ) # Update job state to FAILED when stage fails JobStateHelper.handle_stage_failure( job_repo=self._job_repo, audit_repo=self._audit_repo, uuid_generator=self._uuid_generator, job_id=JobId(result.job_id), stage_name=result.stage_name, error_code=error_code, error_summary=error_summary, correlation_id=result.request_id.value if hasattr(result.request_id, 'value') else str(result.request_id), client_id=str(result.job_id), ) # Update log file path if available if result.log_file_path: stage.log_file_path = result.log_file_path logger.info( "Updated stage log path: job_id=%s, stage=%s", result.job_id, result.stage_name, ) # Save updated stage 
self._stage_repo.save(stage) # Emit audit event event = AuditEvent( event_id=str(self._uuid_generator.generate()), job_id=result.job_id, event_type="STAGE_COMPLETED" if result.status == "success" else "STAGE_FAILED", correlation_id=result.request_id, client_id=result.job_id, # Using job_id as client_id placeholder timestamp=datetime.now(timezone.utc), details={ "stage_name": result.stage_name, "status": result.status, "duration_seconds": result.duration_seconds, "exit_code": result.exit_code, }, ) self._audit_repo.save(event) # Commit both repositories if using SQL # Note: Each repository may have its own session, so commit both if hasattr(self._stage_repo, 'session'): self._stage_repo.session.commit() if hasattr(self._audit_repo, 'session'): self._audit_repo.session.commit() log_secure_info( "info", f"Result processed for job {result.job_id}, stage {result.stage_name}", result.request_id, ) except Exception as exc: # pylint: disable=broad-except logger.exception( "Error handling result: job_id=%s, error=%s", result.job_id, exc, ) ================================================ FILE: build_stream/orchestrator/jobs/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Jobs application layer package.""" from .commands import CreateJobCommand from .dtos import JobResponse from .use_cases import CreateJobUseCase __all__ = [ "CreateJobCommand", "JobResponse", "CreateJobUseCase", ] ================================================ FILE: build_stream/orchestrator/jobs/commands/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Application command DTOs.""" from .create_job import CreateJobCommand __all__ = ["CreateJobCommand"] ================================================ FILE: build_stream/orchestrator/jobs/commands/create_job.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. 
# You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """CreateJob command DTO.""" from dataclasses import dataclass from core.jobs.value_objects import ( ClientId, CorrelationId, IdempotencyKey, ) @dataclass(frozen=True) class CreateJobCommand: """Command to create a new job. Immutable command object representing the intent to create a job. All validation is performed in the use case layer. Attributes: client_id: Client who owns this job (from auth). request_client_id: Client ID from request payload. client_name: Optional client name. correlation_id: Request correlation identifier for tracing. idempotency_key: Client-supplied key for retry deduplication. """ client_id: ClientId request_client_id: str correlation_id: CorrelationId idempotency_key: IdempotencyKey client_name: str | None = None ================================================ FILE: build_stream/orchestrator/jobs/dtos/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Application response DTOs.""" from .job_response import JobResponse __all__ = ["JobResponse"] ================================================ FILE: build_stream/orchestrator/jobs/dtos/job_response.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Job response DTO.""" from dataclasses import dataclass from typing import Optional @dataclass(frozen=True) class JobResponse: """Response DTO for job operations. Immutable data transfer object for returning job information to the API layer. All timestamps are ISO 8601 formatted strings. Attributes: job_id: Unique job identifier. client_id: Client who owns this job. catalog_digest: SHA-256 digest of catalog used. job_state: Current lifecycle state. created_at: Job creation timestamp (ISO 8601). updated_at: Last modification timestamp (ISO 8601). version: Optimistic locking version. tombstoned: Soft delete flag. is_new: True if job was newly created, False if retrieved from idempotency. 
""" job_id: str client_id: str request_client_id: str client_name: Optional[str] job_state: str created_at: str updated_at: str version: int tombstoned: bool is_new: bool = True @staticmethod def from_entity(job, is_new: bool = True) -> "JobResponse": """Create response DTO from Job entity. Args: job: Job domain entity. is_new: True if job was newly created, False if retrieved from idempotency. Returns: JobResponse DTO with serialized values. """ return JobResponse( job_id=str(job.job_id), client_id=str(job.client_id), request_client_id=job.request_client_id, client_name=job.client_name, job_state=job.job_state.value, created_at=job.created_at.isoformat(), updated_at=job.updated_at.isoformat(), version=job.version, tombstoned=job.tombstoned, is_new=is_new, ) ================================================ FILE: build_stream/orchestrator/jobs/use_cases/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Application use cases.""" from .create_job import CreateJobUseCase __all__ = ["CreateJobUseCase"] ================================================ FILE: build_stream/orchestrator/jobs/use_cases/create_job.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. # pylint: disable=too-many-arguments,too-many-positional-arguments,too-few-public-methods """CreateJob use case implementation.""" from datetime import datetime, timezone from typing import List, Optional from core.jobs.entities import Job, Stage, IdempotencyRecord, AuditEvent from core.jobs.exceptions import ( JobAlreadyExistsError, IdempotencyConflictError, ) from core.jobs.repositories import ( JobRepository, StageRepository, IdempotencyRepository, AuditEventRepository, JobIdGenerator, UUIDGenerator, ) from core.jobs.services import FingerprintService from core.jobs.value_objects import JobId, StageName, StageType, RequestFingerprint from ..commands import CreateJobCommand from ..dtos import JobResponse class CreateJobUseCase: """Use case for creating a new job with idempotency support. This use case orchestrates job creation with the following guarantees: - Idempotency: Same idempotency key returns same result - Atomicity: All-or-nothing persistence (job + stages + idempotency record) - Audit trail: Emits JOB_CREATED event - Initial stages: Creates all 5 stages in PENDING state Attributes: job_repo: Job repository port. 
stage_repo: Stage repository port. idempotency_repo: Idempotency repository port. audit_repo: Audit event repository port. """ def __init__( self, job_repo: JobRepository, stage_repo: StageRepository, idempotency_repo: IdempotencyRepository, audit_repo: AuditEventRepository, job_id_generator: JobIdGenerator, uuid_generator: UUIDGenerator, ) -> None: """Initialize use case with repository dependencies. Args: job_repo: Job repository implementation. stage_repo: Stage repository implementation. idempotency_repo: Idempotency repository implementation. audit_repo: Audit event repository implementation. job_id_generator: Job identifier generator to use. uuid_generator: UUID generator for events and other identifiers. """ self._job_repo = job_repo self._stage_repo = stage_repo self._idempotency_repo = idempotency_repo self._audit_repo = audit_repo self._job_id_generator = job_id_generator self._uuid_generator = uuid_generator def execute(self, command: CreateJobCommand) -> JobResponse: """Execute job creation with idempotency. Args: command: CreateJob command with job details. Returns: JobResponse DTO with created job details. Raises: JobAlreadyExistsError: If job_id already exists. IdempotencyConflictError: If idempotency key exists with different fingerprint. """ fingerprint = self._compute_fingerprint(command) existing_job = self._check_idempotency(command, fingerprint) if existing_job is not None: return self._to_response(existing_job, is_new=False) job_id = self._generate_job_id(command) job = self._build_job(command, job_id) stages = self._create_initial_stages(job_id) self._save_job_and_stages(job, stages) self._save_idempotency_record(command, job_id, fingerprint) self._emit_job_created_event(command, job_id, stages) return self._to_response(job) def _generate_job_id(self, command: CreateJobCommand) -> JobId: """Generate a new JobId and ensure it is not already used.""" job_id = self._job_id_generator.generate() if self._job_repo.exists(job_id): raise JobAlreadyExistsError( job_id=str(job_id), correlation_id=str(command.correlation_id), ) return job_id def _check_idempotency( self, command: CreateJobCommand, fingerprint: RequestFingerprint, ) -> Optional[Job]: """Return existing job for idempotent retries, or raise on conflicts.""" existing_record = self._idempotency_repo.find_by_key(command.idempotency_key) if existing_record is None: return None if not existing_record.matches_fingerprint(fingerprint): raise IdempotencyConflictError( idempotency_key=str(command.idempotency_key), existing_job_id=str(existing_record.job_id), correlation_id=str(command.correlation_id), ) return self._job_repo.find_by_id(existing_record.job_id) def _build_job(self, command: CreateJobCommand, job_id: JobId) -> Job: """Build the Job aggregate for a create request.""" return Job( job_id=job_id, client_id=command.client_id, request_client_id=command.request_client_id, client_name=command.client_name, ) def _save_job_and_stages(self, job: Job, stages: List[Stage]) -> None: """Persist the job aggregate and its initial stages.""" self._job_repo.save(job) self._stage_repo.save_all(stages) def _save_idempotency_record( self, command: CreateJobCommand, job_id: JobId, fingerprint: RequestFingerprint, ) -> None: """Persist idempotency record for create job.""" now = self._now_utc() record = IdempotencyRecord( idempotency_key=command.idempotency_key, job_id=job_id, request_fingerprint=fingerprint, client_id=command.client_id, created_at=now, expires_at=now.replace(hour=23, minute=59, second=59), ) 
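# Note: expires_at is pinned to 23:59:59 of the current UTC day, so the record
# is only intended to deduplicate retries made within the same UTC day.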
self._idempotency_repo.save(record) def _emit_job_created_event( self, command: CreateJobCommand, job_id: JobId, stages: List[Stage], ) -> None: """Emit an audit event for job creation.""" event = AuditEvent( event_id=self._generate_event_id(), job_id=job_id, event_type="JOB_CREATED", correlation_id=command.correlation_id, client_id=command.client_id, timestamp=self._now_utc(), details={ "client_name": command.client_name, "stage_count": len(stages), }, ) self._audit_repo.save(event) def _to_response(self, job: Job, is_new: bool = True) -> JobResponse: """Map domain entity to response DTO.""" return JobResponse.from_entity(job, is_new=is_new) def _now_utc(self) -> datetime: """Return current UTC timestamp.""" return datetime.now(timezone.utc) def _compute_fingerprint(self, command: CreateJobCommand) -> RequestFingerprint: """Compute request fingerprint for idempotency. Fingerprint includes only request payload, not auth-derived fields.""" request_body = {} if command.client_name: request_body["client_name"] = command.client_name return FingerprintService.compute(request_body) def _create_initial_stages(self, job_id: JobId) -> List[Stage]: """Create initial stages for the job. Creates all 9 stages in PENDING state: - PARSE_CATALOG - GENERATE_INPUT_FILES - CREATE_LOCAL_REPOSITORY - UPDATE_LOCAL_REPOSITORY - CREATE_IMAGE_REPOSITORY - BUILD_IMAGE - VALIDATE_IMAGE - VALIDATE_IMAGE_ON_TEST - PROMOTE Returns: List of Stage entities in PENDING state. """ stages = [] for stage_type in StageType: stage = Stage( job_id=job_id, stage_name=StageName(stage_type.value), ) stages.append(stage) return stages def _generate_event_id(self) -> str: """Generate event ID for audit events. Returns: UUID v4 string for event identifier. """ return str(self._uuid_generator.generate()) ================================================ FILE: build_stream/orchestrator/local_repo/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Local repository orchestrator module.""" ================================================ FILE: build_stream/orchestrator/local_repo/commands/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
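# Illustrative sketch of the idempotent-create contract implemented by
# CreateJobUseCase above (repository wiring and value-object constructors are
# hypothetical; the observable behaviour follows the use case code):
#
#     command = CreateJobCommand(
#         client_id=ClientId("client-123"),
#         request_client_id="client-123",
#         correlation_id=CorrelationId("req-001"),
#         idempotency_key=IdempotencyKey("create-2026-01-01-a"),
#         client_name="acme",
#     )
#     first = use_case.execute(command)   # first.is_new is True
#     retry = use_case.execute(command)   # retry.is_new is False, same job_id
#
#     # Reusing the same idempotency key with a different payload (for example
#     # another client_name) raises IdempotencyConflictError, because the
#     # request fingerprint no longer matches the stored record.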
"""Application command DTOs for local repository.""" from orchestrator.local_repo.commands.create_local_repo import CreateLocalRepoCommand __all__ = ["CreateLocalRepoCommand"] ================================================ FILE: build_stream/orchestrator/local_repo/commands/create_local_repo.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """CreateLocalRepo command DTO.""" from dataclasses import dataclass from core.jobs.value_objects import ClientId, CorrelationId, JobId @dataclass(frozen=True) class CreateLocalRepoCommand: """Command to trigger local repository creation stage. Immutable command object representing the intent to execute the create-local-repository stage for a given job. Attributes: job_id: Job identifier from URL path. client_id: Client who owns this job (from auth). correlation_id: Request correlation identifier for tracing. """ job_id: JobId client_id: ClientId correlation_id: CorrelationId ================================================ FILE: build_stream/orchestrator/local_repo/dtos/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Application response DTOs for local repository.""" from orchestrator.local_repo.dtos.local_repo_response import LocalRepoResponse __all__ = ["LocalRepoResponse"] ================================================ FILE: build_stream/orchestrator/local_repo/dtos/local_repo_response.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Local repository response DTO.""" from dataclasses import dataclass @dataclass(frozen=True) class LocalRepoResponse: """Response DTO for local repository stage operations. Immutable data transfer object for returning stage acceptance information to the API layer. 
Attributes: job_id: Parent job identifier. stage_name: Stage identifier (create-local-repository). status: Acceptance status (accepted). submitted_at: Submission timestamp (ISO 8601). correlation_id: Request correlation identifier. """ job_id: str stage_name: str status: str submitted_at: str correlation_id: str ================================================ FILE: build_stream/orchestrator/local_repo/result_poller.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Backward-compatible alias for the common ResultPoller. The result poller has been promoted to orchestrator.common.result_poller so that all stage APIs (local_repo, build_image, validate_image_on_test) share a single poller instance. This module re-exports the class under its original name for backward compatibility. """ from orchestrator.common.result_poller import ResultPoller # Backward-compatible alias LocalRepoResultPoller = ResultPoller __all__ = ["LocalRepoResultPoller"] ================================================ FILE: build_stream/orchestrator/local_repo/use_cases/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Application use cases for local repository.""" from orchestrator.local_repo.use_cases.create_local_repo import CreateLocalRepoUseCase __all__ = ["CreateLocalRepoUseCase"] ================================================ FILE: build_stream/orchestrator/local_repo/use_cases/create_local_repo.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
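# How the create-local-repository stage runs end to end: the use case below
# performs only the synchronous part of the work - job ownership and
# stage-guard checks, input-file preparation, and writing a PlaybookRequest
# onto the NFS queue. The playbook watcher service (further below in this
# tree) resolves the whitelisted playbook name "local_repo.yml" to
# /omnia/local_repo/local_repo.yml and runs it asynchronously; the shared
# ResultPoller (orchestrator.common.result_poller, re-exported above) then
# picks up the watcher's result so the stage can be marked COMPLETED or FAILED
# and the matching audit event emitted.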
"""CreateLocalRepo use case implementation.""" import logging from datetime import datetime, timezone from api.logging_utils import log_secure_info from core.jobs.entities import AuditEvent, Stage from core.jobs.exceptions import ( JobNotFoundError, StageAlreadyCompletedError, InvalidStateTransitionError, UpstreamStageNotCompletedError, ) from core.jobs.repositories import ( AuditEventRepository, JobRepository, StageRepository, UUIDGenerator, ) from core.jobs.services import JobStateHelper from core.jobs.value_objects import ( StageName, StageType, StageState, ) from core.localrepo.entities import PlaybookRequest from core.localrepo.exceptions import ( InputDirectoryInvalidError, InputFilesMissingError, ) from core.localrepo.services import ( InputFileService, PlaybookQueueRequestService, ) from core.localrepo.value_objects import ( ExecutionTimeout, ExtraVars, PlaybookPath, ) from orchestrator.local_repo.commands import CreateLocalRepoCommand from orchestrator.local_repo.dtos import LocalRepoResponse logger = logging.getLogger(__name__) DEFAULT_PLAYBOOK_NAME = "local_repo.yml" class CreateLocalRepoUseCase: """Use case for triggering the create-local-repository stage. This use case orchestrates stage execution with the following guarantees: - Stage guard enforcement: Only PENDING stages can be started - Job ownership verification: Client must own the job - Input file validation: Prerequisites checked before playbook execution - Audit trail: Emits STAGE_STARTED event - NFS queue submission: Submits playbook request to NFS queue for watcher service Attributes: job_repo: Job repository port. stage_repo: Stage repository port. audit_repo: Audit event repository port. input_file_service: Input file validation and preparation service. playbook_queue_service: NFS queue service for submitting playbook requests. uuid_generator: UUID generator for events and request IDs. """ def __init__( self, job_repo: JobRepository, stage_repo: StageRepository, audit_repo: AuditEventRepository, input_file_service: InputFileService, playbook_queue_service: PlaybookQueueRequestService, uuid_generator: UUIDGenerator, ) -> None: # pylint: disable=too-many-arguments,too-many-positional-arguments """Initialize use case with repository and service dependencies. Args: job_repo: Job repository implementation. stage_repo: Stage repository implementation. audit_repo: Audit event repository implementation. input_file_service: Input file service for validation. playbook_queue_service: NFS queue service for submitting requests. uuid_generator: UUID generator for identifiers. """ self._job_repo = job_repo self._stage_repo = stage_repo self._audit_repo = audit_repo self._input_file_service = input_file_service self._playbook_queue_service = playbook_queue_service self._uuid_generator = uuid_generator def execute(self, command: CreateLocalRepoCommand) -> LocalRepoResponse: """Execute the create-local-repository stage. Args: command: CreateLocalRepo command with job details. Returns: LocalRepoResponse DTO with acceptance details. Raises: JobNotFoundError: If job does not exist or client mismatch. InvalidStateTransitionError: If stage is not in PENDING state. InputFilesMissingError: If prerequisite input files are missing. InputDirectoryInvalidError: If input directory is invalid. QueueUnavailableError: If NFS queue is not accessible. 
""" self._validate_job(command) stage = self._validate_stage(command) self._prepare_input_files(command, stage) request = self._build_playbook_request(command) self._submit_to_queue(command, request, stage) self._emit_stage_started_event(command) return self._to_response(command, request) def _validate_job(self, command: CreateLocalRepoCommand): """Validate job exists and belongs to the requesting client.""" job = self._job_repo.find_by_id(command.job_id) if job is None or job.tombstoned: raise JobNotFoundError( job_id=str(command.job_id), correlation_id=str(command.correlation_id), ) if job.client_id != command.client_id: raise JobNotFoundError( job_id=str(command.job_id), correlation_id=str(command.correlation_id), ) return job def _verify_upstream_stage_completed( self, command: CreateLocalRepoCommand ) -> None: """Verify that generate-input-files stage is COMPLETED.""" from core.jobs.value_objects import StageState prerequisite_stage = self._stage_repo.find_by_job_and_name( command.job_id, StageName(StageType.GENERATE_INPUT_FILES.value) ) if ( prerequisite_stage is None or prerequisite_stage.stage_state != StageState.COMPLETED ): raise UpstreamStageNotCompletedError( job_id=str(command.job_id), required_stage="generate-input-files", actual_state=( prerequisite_stage.stage_state.value if prerequisite_stage else "NOT_FOUND" ), correlation_id=str(command.correlation_id), ) def _validate_stage(self, command: CreateLocalRepoCommand) -> Stage: """Validate stage exists and is not already COMPLETED or IN_PROGRESS or in PENDING state.""" from core.jobs.value_objects import StageState # Verify upstream stage is completed self._verify_upstream_stage_completed(command) stage_name = StageName(StageType.CREATE_LOCAL_REPOSITORY.value) stage = self._stage_repo.find_by_job_and_name(command.job_id, stage_name) if stage is None: raise JobNotFoundError( job_id=str(command.job_id), correlation_id=str(command.correlation_id), ) # Reject COMPLETED stages (already done) if stage.stage_state == StageState.COMPLETED: raise StageAlreadyCompletedError( job_id=str(command.job_id), stage_name="create-local-repository", correlation_id=str(command.correlation_id), ) # Only allow PENDING stages to transition to IN_PROGRESS if stage.stage_state != StageState.PENDING: if stage.stage_state == StageState.FAILED: raise InvalidStateTransitionError( entity_type="Stage", entity_id=f"{command.job_id}/create-local-repository", from_state=stage.stage_state.value, to_state="IN_PROGRESS", correlation_id=str(command.correlation_id), ) else: # For COMPLETED, IN_PROGRESS, CANCELLED states raise InvalidStateTransitionError( entity_type="Stage", entity_id=f"{command.job_id}/create-local-repository", from_state=stage.stage_state.value, to_state="IN_PROGRESS", correlation_id=str(command.correlation_id), ) # Allow only FAILED stages (retry allowed) return stage def _prepare_input_files( self, command: CreateLocalRepoCommand, stage: Stage, ) -> None: """Prepare input files as prerequisite for playbook execution. If input preparation fails, the stage is transitioned to FAILED and the error is re-raised to prevent playbook invocation. 
""" try: self._input_file_service.prepare_playbook_input( job_id=str(command.job_id), correlation_id=str(command.correlation_id), ) except (InputFilesMissingError, InputDirectoryInvalidError) as exc: try: error_code = type(exc).__name__.upper() error_summary = "Input preparation failed" stage.start() stage.fail( error_code=error_code, error_summary=error_summary, ) self._stage_repo.save(stage) # Update job state to FAILED when stage fails JobStateHelper.handle_stage_failure( job_repo=self._job_repo, audit_repo=self._audit_repo, uuid_generator=self._uuid_generator, job_id=command.job_id, stage_name=StageType.CREATE_LOCAL_REPOSITORY.value, error_code=error_code, error_summary=error_summary, correlation_id=str(command.correlation_id), client_id=str(command.client_id), ) except Exception as save_exc: # If save fails, stage was modified elsewhere log_secure_info( "Stage fail save failed, stage already modified elsewhere: %s", str(save_exc) ) log_secure_info( "error", f"Input preparation failed for job {command.job_id}", str(command.correlation_id), ) raise def _build_playbook_request( self, command: CreateLocalRepoCommand, ) -> PlaybookRequest: """Build a PlaybookRequest entity from the command.""" return PlaybookRequest( job_id=str(command.job_id), stage_name=StageType.CREATE_LOCAL_REPOSITORY.value, playbook_path=PlaybookPath(DEFAULT_PLAYBOOK_NAME), extra_vars=ExtraVars(values={}), correlation_id=str(command.correlation_id), timeout=ExecutionTimeout.default(), submitted_at=datetime.now(timezone.utc).isoformat() + "Z", request_id=str(self._uuid_generator.generate()), ) def _submit_to_queue( self, command: CreateLocalRepoCommand, request: PlaybookRequest, stage: Stage, ) -> None: """Submit playbook request to NFS queue for watcher service.""" try: stage.start() self._stage_repo.save(stage) except Exception as save_exc: # If save fails, stage was modified elsewhere, continue with queue submission log_secure_info( "Stage start save failed, continuing with queue submission: %s", str(save_exc) ) # Submit request to NFS queue self._playbook_queue_service.submit_request( request=request, correlation_id=str(command.correlation_id), ) logger.info( "Playbook request submitted to queue for job %s, stage=%s, correlation_id=%s", command.job_id, StageType.CREATE_LOCAL_REPOSITORY.value, command.correlation_id, ) def _emit_stage_started_event( self, command: CreateLocalRepoCommand, ) -> None: """Emit an audit event for stage start.""" event = AuditEvent( event_id=str(self._uuid_generator.generate()), job_id=command.job_id, event_type="STAGE_STARTED", correlation_id=command.correlation_id, client_id=command.client_id, timestamp=datetime.now(timezone.utc), details={ "stage_name": StageType.CREATE_LOCAL_REPOSITORY.value, }, ) self._audit_repo.save(event) def _to_response( self, command: CreateLocalRepoCommand, request: PlaybookRequest, ) -> LocalRepoResponse: """Map to response DTO.""" return LocalRepoResponse( job_id=str(command.job_id), stage_name=StageType.CREATE_LOCAL_REPOSITORY.value, status="accepted", submitted_at=request.submitted_at, correlation_id=str(command.correlation_id), ) ================================================ FILE: build_stream/orchestrator/validate/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. 
# You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """ValidateImageOnTest orchestration module.""" from orchestrator.validate.commands import ValidateImageOnTestCommand from orchestrator.validate.dtos import ValidateImageOnTestResponse from orchestrator.validate.use_cases import ValidateImageOnTestUseCase __all__ = [ "ValidateImageOnTestCommand", "ValidateImageOnTestResponse", "ValidateImageOnTestUseCase", ] ================================================ FILE: build_stream/orchestrator/validate/commands/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """ValidateImageOnTest command DTOs.""" from orchestrator.validate.commands.validate_image_on_test import ValidateImageOnTestCommand __all__ = ["ValidateImageOnTestCommand"] ================================================ FILE: build_stream/orchestrator/validate/commands/validate_image_on_test.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """ValidateImageOnTest command DTO.""" from dataclasses import dataclass from core.jobs.value_objects import ClientId, CorrelationId, JobId @dataclass(frozen=True) class ValidateImageOnTestCommand: """Command to trigger validate-image-on-test stage. Immutable command object representing the intent to execute the validate-image-on-test stage for a given job. Attributes: job_id: Job identifier from URL path. client_id: Client who owns this job (from auth). correlation_id: Request correlation identifier for tracing. image_key: Image key for the build to validate. """ job_id: JobId client_id: ClientId correlation_id: CorrelationId image_key: str ================================================ FILE: build_stream/orchestrator/validate/dtos/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. 
# You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """ValidateImageOnTest response DTOs.""" from orchestrator.validate.dtos.validate_image_on_test_response import ValidateImageOnTestResponse __all__ = ["ValidateImageOnTestResponse"] ================================================ FILE: build_stream/orchestrator/validate/dtos/validate_image_on_test_response.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """ValidateImageOnTest response DTO.""" from dataclasses import dataclass @dataclass(frozen=True) class ValidateImageOnTestResponse: """Response DTO for validate-image-on-test stage acceptance. Attributes: job_id: Job identifier. stage_name: Stage identifier. status: Acceptance status. submitted_at: Submission timestamp (ISO 8601). correlation_id: Correlation identifier. """ job_id: str stage_name: str status: str submitted_at: str correlation_id: str ================================================ FILE: build_stream/orchestrator/validate/use_cases/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """ValidateImageOnTest use cases.""" from orchestrator.validate.use_cases.validate_image_on_test import ValidateImageOnTestUseCase __all__ = ["ValidateImageOnTestUseCase"] ================================================ FILE: build_stream/orchestrator/validate/use_cases/validate_image_on_test.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 
# See the License for the specific language governing permissions and # limitations under the License. """ValidateImageOnTest use case implementation.""" import logging from datetime import datetime, timezone from api.logging_utils import log_secure_info from core.jobs.entities import AuditEvent, Stage from core.jobs.exceptions import ( JobNotFoundError, UpstreamStageNotCompletedError, InvalidStateTransitionError, ) from core.jobs.repositories import ( AuditEventRepository, JobRepository, StageRepository, UUIDGenerator, ) from core.jobs.services import JobStateHelper from core.jobs.value_objects import ( StageName, StageState, StageType, ) from core.localrepo.value_objects import ( ExecutionTimeout, ExtraVars, PlaybookPath, ) from core.validate.entities import ValidateImageOnTestRequest from core.validate.exceptions import ( StageGuardViolationError, ValidationExecutionError, ) from core.validate.services import ValidateQueueService from orchestrator.validate.commands import ValidateImageOnTestCommand from orchestrator.validate.dtos import ValidateImageOnTestResponse logger = logging.getLogger(__name__) DISCOVERY_PLAYBOOK_NAME = "discovery.yml" DEFAULT_TIMEOUT_MINUTES = 60 class ValidateImageOnTestUseCase: """Use case for triggering the validate-image-on-test stage. This use case orchestrates stage execution with the following guarantees: - Stage guard enforcement: BuildImage stage(s) must be completed - Job ownership verification: Client must own the job - Audit trail: Emits STAGE_STARTED event - NFS queue submission: Submits playbook request to NFS queue for watcher service Attributes: job_repo: Job repository port. stage_repo: Stage repository port. audit_repo: Audit event repository port. queue_service: Validate queue service. uuid_generator: UUID generator for events and request IDs. """ def __init__( self, job_repo: JobRepository, stage_repo: StageRepository, audit_repo: AuditEventRepository, queue_service: ValidateQueueService, uuid_generator: UUIDGenerator, ) -> None: # pylint: disable=too-many-arguments,too-many-positional-arguments """Initialize use case with repository and service dependencies. Args: job_repo: Job repository implementation. stage_repo: Stage repository implementation. audit_repo: Audit event repository implementation. queue_service: Validate queue service. uuid_generator: UUID generator for identifiers. """ self._job_repo = job_repo self._stage_repo = stage_repo self._audit_repo = audit_repo self._queue_service = queue_service self._uuid_generator = uuid_generator def execute(self, command: ValidateImageOnTestCommand) -> ValidateImageOnTestResponse: """Execute the validate-image-on-test stage. Args: command: ValidateImageOnTest command with job details. Returns: ValidateImageOnTestResponse DTO with acceptance details. Raises: JobNotFoundError: If job does not exist or client mismatch. StageGuardViolationError: If upstream build-image stage not completed. ValidationExecutionError: If queue submission fails. 
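        Example (illustrative; assumes the value objects wrap plain strings
        and image_key is a key understood by the build pipeline):

            command = ValidateImageOnTestCommand(
                job_id=JobId("J-0001"),
                client_id=ClientId("client-123"),
                correlation_id=CorrelationId("req-003"),
                image_key="compute-x86_64",
            )
            response = use_case.execute(command)
            assert response.status == "accepted"
            assert response.stage_name == "validate-image-on-test"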
""" self._validate_job(command) stage = self._validate_stage(command) self._enforce_stage_guard(command) request = self._create_request(command) self._submit_to_queue(command, request, stage) self._emit_stage_started_event(command) return self._to_response(command, request) def _validate_job(self, command: ValidateImageOnTestCommand) -> None: """Validate job exists and belongs to the requesting client.""" job = self._job_repo.find_by_id(command.job_id) if job is None or job.tombstoned: raise JobNotFoundError( job_id=str(command.job_id), correlation_id=str(command.correlation_id), ) if job.client_id != command.client_id: raise JobNotFoundError( job_id=str(command.job_id), correlation_id=str(command.correlation_id), ) def _validate_stage(self, command: ValidateImageOnTestCommand) -> Stage: """Validate stage exists and is in PENDING state.""" stage_name = StageName(StageType.VALIDATE_IMAGE_ON_TEST.value) stage = self._stage_repo.find_by_job_and_name(command.job_id, stage_name) if stage is None: raise JobNotFoundError( job_id=str(command.job_id), correlation_id=str(command.correlation_id), ) if stage.stage_state != StageState.PENDING: raise InvalidStateTransitionError( entity_type="Stage", entity_id=f"{command.job_id}/validate-image-on-test", from_state=stage.stage_state.value, to_state="IN_PROGRESS", correlation_id=str(command.correlation_id), ) return stage def _enforce_stage_guard(self, command: ValidateImageOnTestCommand) -> None: """Enforce that at least one build-image stage has completed. The validate-image-on-test stage requires that at least one of the build-image stages (x86_64 or aarch64) has completed successfully. """ x86_stage_name = StageName(StageType.BUILD_IMAGE_X86_64.value) aarch64_stage_name = StageName(StageType.BUILD_IMAGE_AARCH64.value) x86_stage = self._stage_repo.find_by_job_and_name( command.job_id, x86_stage_name ) aarch64_stage = self._stage_repo.find_by_job_and_name( command.job_id, aarch64_stage_name ) x86_completed = ( x86_stage is not None and x86_stage.stage_state == StageState.COMPLETED ) aarch64_completed = ( aarch64_stage is not None and aarch64_stage.stage_state == StageState.COMPLETED ) if not x86_completed and not aarch64_completed: # Determine which stages exist and their states for error message x86_state = x86_stage.stage_state.value if x86_stage else "NOT_FOUND" aarch64_state = aarch64_stage.stage_state.value if aarch64_stage else "NOT_FOUND" raise UpstreamStageNotCompletedError( job_id=str(command.job_id), required_stage="build-image-x86_64 or build-image-aarch64", actual_state=f"x86_64: {x86_state}, aarch64: {aarch64_state}", correlation_id=str(command.correlation_id), ) def _create_request( self, command: ValidateImageOnTestCommand, ) -> ValidateImageOnTestRequest: """Create ValidateImageOnTestRequest entity.""" playbook_path = PlaybookPath(DISCOVERY_PLAYBOOK_NAME) # Get image_key from the API request image_key = command.image_key extra_vars_dict = { "job_id": str(command.job_id), "image_key": image_key, } extra_vars = ExtraVars(extra_vars_dict) return ValidateImageOnTestRequest( job_id=str(command.job_id), stage_name=StageType.VALIDATE_IMAGE_ON_TEST.value, playbook_path=playbook_path, extra_vars=extra_vars, correlation_id=str(command.correlation_id), timeout=ExecutionTimeout(DEFAULT_TIMEOUT_MINUTES), submitted_at=datetime.now(timezone.utc).isoformat().replace("+00:00", "Z"), request_id=str(self._uuid_generator.generate()), ) def _submit_to_queue( self, command: ValidateImageOnTestCommand, request: ValidateImageOnTestRequest, stage: Stage, ) -> 
None: """Submit playbook request to NFS queue for watcher service.""" try: stage.start() self._stage_repo.save(stage) except Exception as save_exc: # If save fails, stage was modified elsewhere, continue with queue submission log_secure_info( "warning", f"Stage start save failed, continuing with queue submission: {save_exc}", ) try: self._queue_service.submit_request( request=request, correlation_id=str(command.correlation_id), ) except Exception as exc: try: error_code = "QUEUE_SUBMISSION_FAILED" error_summary = str(exc) stage.fail( error_code=error_code, error_summary=error_summary, ) self._stage_repo.save(stage) # Update job state to FAILED when stage fails JobStateHelper.handle_stage_failure( job_repo=self._job_repo, audit_repo=self._audit_repo, uuid_generator=self._uuid_generator, job_id=command.job_id, stage_name=StageType.VALIDATE_IMAGE_ON_TEST.value, error_code=error_code, error_summary=error_summary, correlation_id=str(command.correlation_id), client_id=str(command.client_id), ) except Exception as save_exc: # If save fails, stage was modified elsewhere log_secure_info( "warning", f"Stage fail save failed, stage already modified elsewhere: {save_exc}", ) log_secure_info( "error", f"Queue submission failed for job {command.job_id}", str(command.correlation_id), ) raise ValidationExecutionError( message=f"Failed to submit validation request: {exc}", correlation_id=str(command.correlation_id), ) from exc logger.info( "Validate-image-on-test request submitted to queue for job %s, " "correlation_id=%s", command.job_id, command.correlation_id, ) def _emit_stage_started_event( self, command: ValidateImageOnTestCommand, ) -> None: """Emit an audit event for stage start.""" event = AuditEvent( event_id=str(self._uuid_generator.generate()), job_id=command.job_id, event_type="STAGE_STARTED", correlation_id=command.correlation_id, client_id=command.client_id, timestamp=datetime.now(timezone.utc), details={ "stage_name": StageType.VALIDATE_IMAGE_ON_TEST.value, }, ) self._audit_repo.save(event) def _to_response( self, command: ValidateImageOnTestCommand, request: ValidateImageOnTestRequest, ) -> ValidateImageOnTestResponse: """Map to response DTO.""" return ValidateImageOnTestResponse( job_id=str(command.job_id), stage_name=StageType.VALIDATE_IMAGE_ON_TEST.value, status="accepted", submitted_at=request.submitted_at, correlation_id=str(command.correlation_id), ) ================================================ FILE: build_stream/playbook-watcher/playbook_watcher_service.py ================================================ #!/usr/bin/env python3 # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Playbook Watcher Service for OIM Core Container. This service monitors the NFS playbook request queue, executes Ansible playbooks, and writes results back to the results queue. It is designed to be stateless and run as a systemd service in the OIM Core container.
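An illustrative request file (field names follow parse_request_file below; the
exact payload is produced by the orchestrator queue services and may carry
additional fields):

    {
        "job_id": "J-0001",
        "stage_name": "create-local-repository",
        "playbook_path": "local_repo.yml",
        "correlation_id": "req-002",
        "extra_vars": {}
    }

Note that playbook_path carries a whitelisted playbook name, not a filesystem
path; the watcher maps it to the full path (for example
/omnia/local_repo/local_repo.yml) before execution and never runs arbitrary
paths taken from the request.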
Architecture: - Polls /opt/omnia/build_stream/playbook_queue/requests/ every 2 seconds - Moves requests to processing/ to prevent duplicate execution - Executes ansible-playbook with timeout and error handling - Writes structured results to /opt/omnia/build_stream/playbook_queue/results/ - Supports max 5 concurrent playbook executions """ import json import logging import os import re import shutil import signal import subprocess import sys import time from datetime import datetime, timezone from pathlib import Path from threading import Thread, Semaphore from typing import Dict, Optional, Any, List # Implicit logging utilities for secure logging def log_secure_info(level: str, message: str, identifier: Optional[str] = None) -> None: """Log information securely with optional identifier truncation. This function provides consistent secure logging across all modules. When an identifier is provided, only the first 8 characters are logged to prevent exposure of sensitive data while maintaining debugging capability. Args: level: Log level ('info', 'warning', 'error', 'debug', 'critical') message: Log message template identifier: Optional identifier (job_id, request_id, etc.) - first 8 chars logged """ logger = logging.getLogger(__name__) if identifier: # Always log first 8 characters for identification log_message = f"{message}: {identifier[:8]}..." else: # Generic message when no identifier context log_message = message log_func = getattr(logger, level) log_func(log_message) # Configuration QUEUE_BASE = Path(os.getenv("PLAYBOOK_QUEUE_BASE", "")) REQUESTS_DIR = QUEUE_BASE / "requests" RESULTS_DIR = QUEUE_BASE / "results" PROCESSING_DIR = QUEUE_BASE / "processing" ARCHIVE_DIR = QUEUE_BASE / "archive" # NFS shared path configuration NFS_SHARE_PATH = Path(os.getenv("NFS_SHARE_PATH", "")) HOST_LOG_BASE_DIR = NFS_SHARE_PATH / "omnia" / "log" / "build_stream" CONTAINER_LOG_BASE_DIR = Path("/opt/omnia/log/build_stream") POLL_INTERVAL_SECONDS = int(os.getenv("POLL_INTERVAL_SECONDS", "2")) MAX_CONCURRENT_JOBS = int(os.getenv("MAX_CONCURRENT_JOBS", "1")) DEFAULT_TIMEOUT_MINUTES = int(os.getenv("DEFAULT_TIMEOUT_MINUTES", "30")) # Playbook name to full path mapping - prevents injection from user input PLAYBOOK_NAME_TO_PATH = { "include_input_dir.yml": "/omnia/utils/include_input_dir.yml", "build_image_aarch64.yml": "/omnia/build_image_aarch64/build_image_aarch64.yml", "build_image_x86_64.yml": "/omnia/build_image_x86_64/build_image_x86_64.yml", "discovery.yml": "/omnia/discovery/discovery.yml", "local_repo.yml": "/omnia/local_repo/local_repo.yml", } # Logging configuration LOG_LEVEL = os.getenv("LOG_LEVEL", "INFO") logging.basicConfig( level=getattr(logging, LOG_LEVEL), format="%(asctime)s - %(name)s - %(levelname)s - %(message)s", handlers=[ logging.StreamHandler(sys.stdout) ] ) logger = logging.getLogger("playbook_watcher") # Global state SHUTDOWN_REQUESTED = False job_semaphore = Semaphore(MAX_CONCURRENT_JOBS) def signal_handler(signum, _): """Handle shutdown signals gracefully.""" global SHUTDOWN_REQUESTED log_secure_info( "info", "Received signal", str(signum) ) SHUTDOWN_REQUESTED = True def ensure_directories(): """Ensure all required directories exist with proper permissions.""" directories = [ REQUESTS_DIR, RESULTS_DIR, PROCESSING_DIR, ARCHIVE_DIR, ARCHIVE_DIR / "requests", ARCHIVE_DIR / "results", HOST_LOG_BASE_DIR, # NFS log directory ] for directory in directories: try: directory.mkdir(parents=True, exist_ok=True) log_secure_info( "debug", "Ensured directory exists" ) except (OSError, IOError) 
as e: log_secure_info( "error", "Failed to create directory" ) raise def validate_playbook_name(playbook_name: str) -> bool: """Validate playbook name against the allowed whitelist. Args: playbook_name: Name of the playbook file (without path) Returns: True if name is in the whitelist, False otherwise """ # Ensure it's a playbook name (no slash) if '/' in playbook_name: log_secure_info( "error", "Playbook name cannot contain path separators", playbook_name[:8] if playbook_name else None ) return False # Check if it's in our mapping if playbook_name in PLAYBOOK_NAME_TO_PATH: return True # Log the rejection log_secure_info( "error", "Playbook name not in allowed whitelist", playbook_name[:8] if playbook_name else None ) return False def map_playbook_name_to_path(playbook_name: str) -> Optional[str]: """Validate playbook name and map it to the full path. Args: playbook_name: Name of the playbook file (untrusted input) Returns: The full path if valid, None if invalid """ # Validate the playbook name if not validate_playbook_name(playbook_name): return None # Map the name to full path full_path = PLAYBOOK_NAME_TO_PATH[playbook_name] # Return a new string instance to break the taint chain return str(full_path) def validate_job_id(job_id: str) -> bool: """Validate job ID format. Args: job_id: Job identifier Returns: True if valid, False otherwise """ # Allow UUID format or alphanumeric with hyphens/underscores uuid_pattern = r'^[0-9a-f]{8}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{4}-[0-9a-f]{12}$' alnum_pattern = r'^[a-zA-Z0-9_-]+$' return bool(re.match(uuid_pattern, job_id) or re.match(alnum_pattern, job_id)) def validate_stage_name(stage_name: str) -> bool: """Validate stage name to prevent injection. Args: stage_name: Name of the stage Returns: True if valid, False otherwise """ # Only allow alphanumeric, spaces, hyphens, and underscores pattern = r'^[a-zA-Z0-9 _-]+$' return bool(re.match(pattern, stage_name)) def validate_command(cmd: list, playbook_path: str) -> bool: """Validate command structure and arguments to prevent injection. This function implements strict command allowlisting with rigorous validation of each command argument to prevent any possibility of command injection. Args: cmd: Command list to validate playbook_path: Expected playbook path (already validated) Returns: True if valid, raises ValueError with detailed message if invalid """ # Define the minimum required command structure # This defines the exact structure and position of each argument MIN_REQUIRED_STRUCTURE = [ {"value": "podman", "fixed": True}, {"value": "exec", "fixed": True}, {"value": "-e", "fixed": True}, {"value": "ANSIBLE_LOG_PATH=", "prefix": True}, # Only the prefix is fixed, value is validated separately {"value": "omnia_core", "fixed": True}, {"value": "ansible-playbook", "fixed": True}, {"value": None, "fixed": False}, # playbook_path (validated separately) ] # Define allowed additional arguments ALLOWED_EXTRA_ARGS = [ "-v", "--extra-vars", "--inventory" ] # 1. Check minimum command length min_required_length = len(MIN_REQUIRED_STRUCTURE) if len(cmd) < min_required_length: log_secure_info( "error", "Command structure too short", f"Expected at least {min_required_length}, got {len(cmd)}" ) raise ValueError("Invalid command structure") # 2. 
Structure validation - each argument must match the allowlisted structure for i, (arg, allowed) in enumerate(zip(cmd[:min_required_length], MIN_REQUIRED_STRUCTURE)): # Type check - must be string if not isinstance(arg, str): log_secure_info( "error", "Non-string argument in command", f"Position: {i}" ) raise ValueError("Invalid command argument type") # Length check - prevent excessively long arguments if len(arg) > 4096: # Reasonable maximum length log_secure_info( "error", "Command argument exceeds maximum allowed length", f"Position: {i}, Length: {len(arg)}" ) raise ValueError("Command argument too long") # Fixed arguments must match exactly if allowed.get("fixed", False) and arg != allowed.get("value", ""): log_secure_info( "error", f"Command argument at position {i} does not match allowlist", f"Expected '{allowed.get('value', '')}', got '{arg}'" ) raise ValueError(f"Invalid command argument at position {i}") # Arguments with prefix must start with the specified prefix if allowed.get("prefix") and not arg.startswith(allowed.get("value", "")): log_secure_info( "error", f"Command argument at position {i} does not start with required prefix", f"Expected prefix '{allowed.get('value', '')}', got '{arg}'" ) raise ValueError(f"Invalid command argument prefix at position {i}") # Special validation for playbook path if not allowed.get("fixed", True) and i == 6: # playbook_path position if arg != playbook_path: log_secure_info( "error", "Playbook path in command does not match validated path" ) raise ValueError("Playbook path mismatch") # 3. Validate additional arguments (after the minimum required structure) if len(cmd) > min_required_length: # Check for allowed additional arguments i = min_required_length while i < len(cmd): arg = cmd[i] # Check if this is a parameter that takes a value if arg in ["--inventory", "--extra-vars"] and i + 1 < len(cmd): # Skip the value (next argument) i += 2 elif arg == "-v" or arg.startswith("-v"): # Verbosity flag i += 1 else: # Unknown argument log_secure_info( "error", "Unknown additional argument", f"Position: {i}, Value: {arg}" ) raise ValueError(f"Unknown additional argument: {arg}") # 4. Character validation - check for dangerous characters in all arguments DANGEROUS_CHARS = ['\n', '\r', '\0', '\t', '\v', '\f', '\a', '\b', '\\', '`', '$', '&', '|', ';', '<', '>', '(', ')', '*', '?', '~', '#'] # Skip validation for playbook path position and --extra-vars value SKIP_POSITIONS = [6] # Position of playbook_path # Find positions of --extra-vars and --inventory values to skip validation i = min_required_length while i < len(cmd): if cmd[i] == "--extra-vars" and i + 1 < len(cmd): SKIP_POSITIONS.append(i + 1) # Skip validating the JSON value i += 2 elif cmd[i] == "--inventory" and i + 1 < len(cmd): SKIP_POSITIONS.append(i + 1) # Skip validating the inventory file path i += 2 else: i += 1 for i, arg in enumerate(cmd): # Skip validation for playbook path and --extra-vars value if i in SKIP_POSITIONS: continue for char in DANGEROUS_CHARS: if char in arg: log_secure_info( "error", "Dangerous character detected in command argument", f"Position: {i}, Character: {repr(char)}" ) raise ValueError("Invalid command argument content") # 4. 
Shell binary check - prevent shell execution SHELL_BINARIES = ["sh", "bash", "dash", "zsh", "ksh", "csh", "tcsh", "fish"] for i, arg in enumerate(cmd): if arg in SHELL_BINARIES: log_secure_info( "error", "Shell binary detected in command argument", f"Position: {i}, Value: {arg}" ) raise ValueError("Shell binary not allowed in command") # 5. URL check - prevent remote resource fetching for i, arg in enumerate(cmd): if re.search(r'(https?|ftp|file)://', arg): log_secure_info( "error", "URL detected in command argument", f"Position: {i}, Value: {arg[:8]}" ) raise ValueError("URLs not allowed in command arguments") return True # validate_extra_vars function has been removed as we no longer use extra_vars # This eliminates a potential security vulnerability def parse_request_file(request_path: Path) -> Optional[Dict[str, Any]]: """Parse and validate request file. Args: request_path: Path to the request JSON file Returns: Parsed request dictionary or None if invalid """ try: # Validate file path to prevent directory traversal request_path_str = str(request_path) if '..' in request_path_str or not request_path_str.startswith('/'): log_secure_info( "error", "Invalid request file path: possible directory traversal", request_path_str[:8] ) return None # Ensure file exists and is a regular file if not os.path.isfile(request_path): log_secure_info( "error", "Request path is not a regular file", request_path_str[:8] ) return None with open(request_path, 'r', encoding='utf-8') as f: try: request_data = json.load(f) except json.JSONDecodeError: log_secure_info( "error", "Invalid JSON in request file", request_path_str[:8] ) return None # Validate data type if not isinstance(request_data, dict): log_secure_info( "error", "Request data is not a dictionary", request_path_str[:8] ) return None # Validate required fields required_fields = ["job_id", "stage_name", "playbook_path"] missing_fields = [field for field in required_fields if field not in request_data] if missing_fields: logger.error( "Request file missing required fields: %s", ', '.join(missing_fields) ) return None # Validate inputs to prevent injection job_id = str(request_data["job_id"]) stage_name = str(request_data["stage_name"]) playbook_name = str(request_data["playbook_path"]) # This is actually the playbook name if not validate_job_id(job_id): log_secure_info("error", "Invalid job_id format in request", job_id[:8]) return None if not validate_stage_name(stage_name): log_secure_info("error", "Invalid stage_name format in request", stage_name[:8]) return None # Map the playbook name to its full path # This returns the full path or None if validation fails full_playbook_path = map_playbook_name_to_path(playbook_name) if full_playbook_path is None: log_secure_info("error", "Invalid or unknown playbook name in request", playbook_name[:8]) return None # Set defaults request_data.setdefault("correlation_id", job_id) # Check for inventory_file_path if "inventory_file_path" in request_data: inventory_file_path = str(request_data["inventory_file_path"]) # Validate inventory file path if not inventory_file_path.startswith("/") or ".." 
in inventory_file_path: log_secure_info( "error", "Invalid inventory file path: possible directory traversal", job_id[:8] ) return None log_secure_info( "info", "Found inventory file path in request", job_id[:8] ) # Check for extra_vars field if "extra_vars" in request_data: if not isinstance(request_data["extra_vars"], dict): log_secure_info("error", "extra_vars must be a dictionary", job_id[:8]) return None log_secure_info( "info", "Found extra_vars in request", job_id[:8] ) # We're no longer using extra_args, so remove it if present if "extra_args" in request_data: log_secure_info( "info", "Found extra_args in request but ignoring it", job_id[:8] ) # Remove extra_args from request_data del request_data["extra_args"] # Store both the original playbook name and the mapped full path # The full path will be used for command execution request_data["playbook_name"] = playbook_name request_data["full_playbook_path"] = full_playbook_path log_secure_info( "info", "Parsed request for job", job_id ) log_secure_info( "debug", "Stage name", stage_name ) return request_data except json.JSONDecodeError as e: log_secure_info( "error", "Invalid JSON in request file" ) return None except (KeyError, TypeError, ValueError) as e: log_secure_info( "error", "Error parsing request file" ) return None def extract_playbook_name(full_playbook_path: str) -> str: """Extract the playbook name from the full path. Args: full_playbook_path: Full path to the playbook file Returns: The playbook name (filename without path) """ # Get the basename (filename with extension) return os.path.basename(full_playbook_path) def _build_log_paths(playbook_path: str, started_at: datetime) -> tuple: """Build host and container log file paths without job_id. Args: playbook_path: Full path to the playbook file started_at: Start time for timestamp Returns: Tuple of (host_log_file_path, container_log_file_path, host_log_dir) """ # Extract playbook name from the full path playbook_name = extract_playbook_name(playbook_path) # Create base log directory on NFS share (no job-specific subdirectory) host_log_dir = HOST_LOG_BASE_DIR host_log_dir.mkdir(parents=True, exist_ok=True) # Create log file path with playbook name and timestamp only (no job_id) timestamp = started_at.strftime("%Y%m%d_%H%M%S") host_log_file_path = host_log_dir / f"{playbook_name}_{timestamp}.log" # Container log path (equivalent path in container) container_log_file_path = ( CONTAINER_LOG_BASE_DIR / f"{playbook_name}_{timestamp}.log" ) return host_log_file_path, container_log_file_path, host_log_dir def move_log_to_job_directory(host_log_file_path: Path, job_id: str) -> Path: """Move log file to a job-specific directory after completion. 
Args: host_log_file_path: Current path of the log file job_id: Job identifier for creating the job directory Returns: New path of the log file in the job directory """ # Create job-specific directory job_dir = HOST_LOG_BASE_DIR / job_id job_dir.mkdir(parents=True, exist_ok=True) # Get the log filename log_filename = host_log_file_path.name # New path in job directory new_log_path = job_dir / log_filename # Move the log file try: shutil.move(str(host_log_file_path), str(new_log_path)) log_secure_info( "info", "Log file moved to job directory", job_id[:12] if job_id else "" ) except (OSError, IOError) as e: log_secure_info( "error", "Failed to move log file to job directory" ) # Return original path if move fails return host_log_file_path return new_log_path def execute_playbook(request_data: Dict[str, Any]) -> Dict[str, Any]: """Execute Ansible playbook and capture results. Args: request_data: Parsed request dictionary Returns: Result dictionary with execution details """ job_id = request_data["job_id"] stage_name = request_data["stage_name"] # Use the full_playbook_path which is the mapped full path from playbook name playbook_path = request_data["full_playbook_path"] playbook_name = request_data["playbook_name"] # Original playbook name for logging # Use default timeout to prevent potential injection from user input timeout_minutes = DEFAULT_TIMEOUT_MINUTES correlation_id = request_data.get("correlation_id", job_id) log_secure_info( "info", "Executing playbook for job", job_id ) log_secure_info( "debug", "Stage name", stage_name ) log_secure_info( "debug", "Playbook name", playbook_name ) started_at = datetime.now(timezone.utc) host_log_file_path, container_log_file_path, _ = _build_log_paths( playbook_path, started_at ) # Build podman command to execute playbook in omnia_core container # Build command as a list to prevent shell injection # Ensure environment variable value is properly sanitized log_path_str = str(container_log_file_path) # Strict validation for log path if not log_path_str.startswith('/') or '..' 
in log_path_str: log_secure_info( "error", "Container log path must be absolute and cannot contain path traversal", log_path_str[:8] ) raise ValueError("Invalid container log path") # Validate log path format using regex (alphanumeric, underscore, hyphen, forward slash, and dots) if not re.match(r'^[a-zA-Z0-9_\-/.]+$', log_path_str): log_secure_info( "error", "Container log path contains invalid characters", log_path_str[:8] ) raise ValueError("Invalid container log path format") # Build command as a list to prevent shell injection # We no longer use extra_vars to prevent potential command injection # This simplifies the code and removes a potential security vulnerability # Command structure will be validated by the validate_command function # Check if this is a build_image playbook # is_build_image = "build_image" in playbook_name # Build command as a list with all validated components # Each element is a separate argument - no shell interpretation possible cmd = [ "podman", "exec", "-e", f"ANSIBLE_LOG_PATH={log_path_str}", "omnia_core", "ansible-playbook", playbook_path # Validated against strict whitelist ] # Add inventory file path if present for build_image playbooks if "inventory_file_path" in request_data: inventory_file_path = str(request_data["inventory_file_path"]) cmd.extend(["--inventory", inventory_file_path]) log_secure_info( "info", "Using inventory file for build_image playbook", inventory_file_path[:8] ) # Add extra_vars if present for build_image playbooks if "extra_vars" in request_data: import json extra_vars = request_data["extra_vars"] # Convert extra_vars to a JSON string extra_vars_json = json.dumps(extra_vars) # Add as a single --extra-vars parameter cmd.extend(["--extra-vars", extra_vars_json]) log_secure_info( "info", "Added extra_vars as JSON for build_image playbook", job_id ) # Add verbosity flag cmd.append("-v") # Use the dedicated command validation function to perform comprehensive validation # This includes structure validation, argument validation, and security checks try: validate_command(cmd, playbook_path) except ValueError as e: log_secure_info( "error", "Command validation failed", str(e) ) raise ValueError(f"Command validation failed: {e}") # Don't log the full command with potentially sensitive paths log_secure_info( "debug", "Executing ansible playbook for job", job_id ) log_secure_info( "info", "Ansible logs will be written to job directory", job_id ) try: # Execute playbook with timeout and custom log path timeout_seconds = timeout_minutes * 60 # Only set ANSIBLE_LOG_PATH in the environment # This is already passed as -e parameter to podman exec # No need for a full sanitized environment # Log the command being executed (without sensitive details) log_secure_info( "debug", "Executing command", f"podman exec omnia_core ansible-playbook [playbook]" ) # Execute with explicit shell=False and validated arguments result = subprocess.run( cmd, capture_output=False, # Don't capture to avoid duplication with ANSIBLE_LOG_PATH timeout=timeout_seconds, check=False, shell=False, # Explicitly set shell=False to prevent injection text=False, # Don't interpret output as text to prevent encoding issues start_new_session=True # Isolate the process from the parent session ) # Log file is directly accessible via NFS share, no need to copy # Wait a moment for log to be written time.sleep(0.5) # Verify log file exists if host_log_file_path.exists(): log_secure_info( "info", "Log file confirmed for job", job_id ) # Move log file to job-specific directory after 
completion host_log_file_path = move_log_to_job_directory(host_log_file_path, job_id) else: log_secure_info( "warning", "Log file not found at expected location for job", job_id ) completed_at = datetime.now(timezone.utc) duration_seconds = (completed_at - started_at).total_seconds() # Determine status status = "success" if result.returncode == 0 else "failed" log_secure_info( "info", "Playbook execution completed for job", job_id ) log_secure_info( "debug", "Execution status", status ) # Build result dictionary result_data = { "job_id": job_id, "stage_name": stage_name, "request_id": request_data.get("request_id", job_id), "correlation_id": correlation_id, "status": status, "exit_code": result.returncode, "log_file_path": str(host_log_file_path), # Host path to Ansible log file (NFS share) "started_at": started_at.isoformat(), "completed_at": completed_at.isoformat(), "duration_seconds": int(duration_seconds), "timestamp": completed_at.isoformat(), } # Add error details if failed if status == "failed": result_data["error_code"] = "PLAYBOOK_EXECUTION_FAILED" result_data["error_summary"] = f"Playbook exited with code {result.returncode}" return result_data except subprocess.TimeoutExpired: completed_at = datetime.now(timezone.utc) duration_seconds = (completed_at - started_at).total_seconds() log_secure_info( "error", "Playbook execution timed out for job", job_id ) return { "job_id": job_id, "stage_name": stage_name, "request_id": request_data.get("request_id", job_id), "correlation_id": correlation_id, "status": "failed", "exit_code": -1, "stdout": "", "stderr": f"Playbook execution timed out after {timeout_minutes} minutes", "started_at": started_at.isoformat(), "completed_at": completed_at.isoformat(), "duration_seconds": int(duration_seconds), "error_code": "PLAYBOOK_TIMEOUT", "error_summary": f"Execution exceeded timeout of {timeout_minutes} minutes", "timestamp": completed_at.isoformat(), } except (OSError, subprocess.SubprocessError) as e: completed_at = datetime.now(timezone.utc) duration_seconds = (completed_at - started_at).total_seconds() logger.exception( "Unexpected error executing playbook for job %s", job_id ) return { "job_id": job_id, "stage_name": stage_name, "request_id": request_data.get("request_id", job_id), "correlation_id": correlation_id, "status": "failed", "exit_code": -1, "stdout": "", "stderr": str(e), "started_at": started_at.isoformat(), "completed_at": completed_at.isoformat(), "duration_seconds": int(duration_seconds), "error_code": "SYSTEM_ERROR", "error_summary": f"System error during execution: {str(e)}", "timestamp": completed_at.isoformat(), } def write_result_file(result_data: Dict[str, Any], original_filename: str) -> bool: """Write result file to results directory. Args: result_data: Result dictionary to write original_filename: Original request filename for correlation Returns: True if successful, False otherwise """ job_id = result_data["job_id"] try: # Use same filename pattern as request for easy correlation result_filename = original_filename result_path = RESULTS_DIR / result_filename with open(result_path, 'w', encoding='utf-8') as f: json.dump(result_data, f, indent=2) log_secure_info( "info", "Wrote result file for job", job_id ) return True except (OSError, IOError) as e: log_secure_info( "error", "Failed to write result file for job", job_id ) return False def archive_request_file(request_path: Path) -> None: """Archive processed request file. 
Args: request_path: Path to the request file to archive """ try: archive_path = ARCHIVE_DIR / "requests" / request_path.name shutil.move(str(request_path), str(archive_path)) log_secure_info( "debug", "Archived request file", request_path.name[:8] if request_path.name else None ) except (OSError, IOError) as e: log_secure_info( "warning", "Failed to archive request file", request_path.name[:8] if request_path.name else None ) def process_request(request_path: Path) -> None: """Process a single request file. This function handles the complete lifecycle of a request: 1. Move to processing directory (atomic lock) 2. Parse request 3. Execute playbook 4. Write result 5. Archive request Args: request_path: Path to the request file """ request_filename = request_path.name processing_path = PROCESSING_DIR / request_filename with job_semaphore: try: # Move to processing directory (atomic lock) try: shutil.move(str(request_path), str(processing_path)) log_secure_info( "debug", "Moved request to processing", request_filename[:8] if request_filename else None ) except FileNotFoundError: # File already moved by another process log_secure_info( "debug", "Request already being processed", request_filename[:8] if request_filename else None ) return # Parse request request_data = parse_request_file(processing_path) if not request_data: log_secure_info( "error", "Invalid request file", request_filename[:8] if request_filename else None ) # Write error result error_result = { "job_id": "unknown", "stage_name": "unknown", "status": "failed", "exit_code": -1, "error_code": "INVALID_REQUEST", "error_summary": "Failed to parse request file", "timestamp": datetime.now(timezone.utc).isoformat(), } write_result_file(error_result, request_filename) archive_request_file(processing_path) return # Execute playbook result_data = execute_playbook(request_data) # Write result write_result_file(result_data, request_filename) # Archive request archive_request_file(processing_path) finally: # Ensure processing file is cleaned up even on error if processing_path.exists(): try: processing_path.unlink() except (OSError, IOError) as e: log_secure_info( "warning", "Failed to remove processing file", request_filename[:8] if request_filename else None ) def process_request_async(request_path: Path) -> None: """Process request in a separate thread. Args: request_path: Path to the request file """ thread = Thread(target=process_request, args=(request_path,), daemon=True) thread.start() def scan_and_process_requests() -> int: """Scan requests directory and process new requests. 
Returns: Number of requests processed """ try: request_files = sorted(REQUESTS_DIR.glob("*.json")) if not request_files: return 0 log_secure_info( "debug", "Found request files", str(len(request_files)) ) processed_count = 0 for request_path in request_files: if SHUTDOWN_REQUESTED: log_secure_info( "info", "Shutdown requested" ) break try: # Process asynchronously process_request_async(request_path) processed_count += 1 except (OSError, IOError) as e: log_secure_info( "error", "Error processing request", request_path.name[:8] if request_path.name else None ) return processed_count except (OSError, IOError) as e: log_secure_info( "error", "Error scanning requests directory" ) return 0 def run_watcher_loop(): """Main watcher loop that continuously polls for requests.""" log_secure_info( "info", "Starting Playbook Watcher Service" ) log_secure_info( "info", "Queue base directory" ) log_secure_info( "info", f"Poll interval: {POLL_INTERVAL_SECONDS}s" ) log_secure_info( "info", f"Max concurrent jobs: {MAX_CONCURRENT_JOBS}" ) log_secure_info( "info", f"Default timeout: {DEFAULT_TIMEOUT_MINUTES}m" ) # Ensure directories exist try: ensure_directories() except (OSError, IOError) as e: log_secure_info( "critical", "Failed to initialize directories" ) sys.exit(1) # Main loop iteration = 0 while not SHUTDOWN_REQUESTED: iteration += 1 try: processed_count = scan_and_process_requests() if processed_count > 0: log_secure_info( "info", "Processed requests in iteration", str(processed_count) ) except RuntimeError as e: logger.exception( "Unexpected error in watcher loop iteration %d", iteration ) # Sleep before next poll time.sleep(POLL_INTERVAL_SECONDS) log_secure_info( "info", "Playbook Watcher Service stopped" ) def main(): """Main entry point for the watcher service.""" # Register signal handlers signal.signal(signal.SIGTERM, signal_handler) signal.signal(signal.SIGINT, signal_handler) try: run_watcher_loop() except KeyboardInterrupt: log_secure_info( "info", "Received keyboard interrupt" ) except (RuntimeError, OSError): log_secure_info( "critical", "Fatal error in watcher service" ) sys.exit(1) sys.exit(0) if __name__ == "__main__": main() ================================================ FILE: build_stream/pytest.ini ================================================ [pytest] pythonpath = .
testpaths = tests python_files = test_*.py python_classes = Test* python_functions = test_* markers = unit: marks tests as unit tests integration: marks tests as integration tests e2e: marks tests as end-to-end tests env = ENV = dev TEST_DATABASE_URL = postgresql://admin:dell1234@localhost:5432/build_stream_db DATABASE_URL = postgresql://admin:dell1234@localhost:5432/build_stream_db ================================================ FILE: build_stream/requirements-dev.txt ================================================ # Development and testing dependencies for Build Stream API # Install with: pip install -r requirements-dev.txt # Testing framework pytest>=7.4.0 pytest-asyncio>=0.21.0 pytest-cov>=4.1.0 # HTTP client for FastAPI testing httpx>=0.25.0 # Code quality pylint>=3.0.0 black>=23.0.0 isort>=5.12.0 ================================================ FILE: build_stream/requirements.txt ================================================ # Core dependencies for Build Stream API # Install with: pip install -r requirements.txt # Web framework fastapi>=0.104.0 uvicorn>=0.24.0 pydantic>=2.5.0 # Authentication PyJWT>=2.8.0 cryptography>=41.0.0 argon2-cffi>=23.1.0 # Dependency injection dependency-injector>=4.41.0 # Vault integration pyyaml>=6.0.0 ansible>=8.0.0 # Form data handling python-multipart>=0.0.6 # HTTP client httpx>=0.25.0 # JSON Schema validation jsonschema>=4.20.0 # Database sqlalchemy>=2.0.0 psycopg2-binary>=2.9.0 alembic>=1.13.0 ================================================ FILE: build_stream/scripts/generate_jwt_keys.sh ================================================ #!/bin/bash # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. # Generate RSA key pair for JWT signing # # This script generates a 4096-bit RSA key pair for signing JWT tokens. # The keys are stored in the specified directory with appropriate permissions. # # Usage: # ./generate_jwt_keys.sh [output_directory] # # Default output directory: /etc/omnia/keys set -euo pipefail # Configuration KEY_SIZE=4096 PRIVATE_KEY_NAME="jwt_private.pem" PUBLIC_KEY_NAME="jwt_public.pem" DEFAULT_OUTPUT_DIR="/opt/omnia/build_stream_root/api/.auth/keys" # Parse arguments OUTPUT_DIR="${1:-$DEFAULT_OUTPUT_DIR}" # Colors for output RED='\033[0;31m' GREEN='\033[0;32m' YELLOW='\033[1;33m' NC='\033[0m' # No Color log_info() { echo -e "${GREEN}[INFO]${NC} $1" } log_warn() { echo -e "${YELLOW}[WARN]${NC} $1" } log_error() { echo -e "${RED}[ERROR]${NC} $1" } # Check if openssl is available if ! command -v openssl &> /dev/null; then log_error "openssl is required but not installed." exit 1 fi # Create output directory if it doesn't exist if [ ! 
-d "$OUTPUT_DIR" ]; then log_info "Creating output directory: $OUTPUT_DIR" mkdir -p "$OUTPUT_DIR" fi PRIVATE_KEY_PATH="$OUTPUT_DIR/$PRIVATE_KEY_NAME" PUBLIC_KEY_PATH="$OUTPUT_DIR/$PUBLIC_KEY_NAME" # Check if keys already exist if [ -f "$PRIVATE_KEY_PATH" ] || [ -f "$PUBLIC_KEY_PATH" ]; then log_warn "JWT keys already exist in $OUTPUT_DIR" read -p "Do you want to overwrite them? (y/N): " -n 1 -r echo if [[ ! $REPLY =~ ^[Yy]$ ]]; then log_info "Key generation cancelled." exit 0 fi log_warn "Overwriting existing keys..." fi log_info "Generating $KEY_SIZE-bit RSA private key..." openssl genrsa -out "$PRIVATE_KEY_PATH" "$KEY_SIZE" 2>/dev/null if [ $? -ne 0 ]; then log_error "Failed to generate private key" exit 1 fi log_info "Extracting public key..." openssl rsa -in "$PRIVATE_KEY_PATH" -pubout -out "$PUBLIC_KEY_PATH" 2>/dev/null if [ $? -ne 0 ]; then log_error "Failed to extract public key" rm -f "$PRIVATE_KEY_PATH" exit 1 fi # Set secure permissions log_info "Setting secure permissions..." chmod 600 "$PRIVATE_KEY_PATH" # Owner read/write only chmod 644 "$PUBLIC_KEY_PATH" # Owner read/write, others read # Verify the keys log_info "Verifying key pair..." VERIFY_RESULT=$(openssl rsa -in "$PRIVATE_KEY_PATH" -check 2>&1) if echo "$VERIFY_RESULT" | grep -q "RSA key ok"; then log_info "Key verification successful" else log_error "Key verification failed" exit 1 fi # Display key information log_info "JWT keys generated successfully!" echo "" echo "Key Details:" echo " Private Key: $PRIVATE_KEY_PATH" echo " Public Key: $PUBLIC_KEY_PATH" echo " Key Size: $KEY_SIZE bits" echo " Algorithm: RS256 (RSA with SHA-256)" echo "" echo "Environment Variables (add to your configuration):" echo " export JWT_PRIVATE_KEY_PATH=\"$PRIVATE_KEY_PATH\"" echo " export JWT_PUBLIC_KEY_PATH=\"$PUBLIC_KEY_PATH\"" echo "" echo "Key Rotation Recommendations:" echo " - Rotate keys every 365 days for production environments" echo " - Keep backup of old public key for token validation during rotation" echo " - Update JWT_KEY_ID environment variable when rotating keys" echo "" log_warn "IMPORTANT: Keep the private key secure and never commit it to version control!" ================================================ FILE: build_stream/tests/README.md ================================================ # Build Stream Test Suite This directory contains comprehensive unit and integration tests for all Build Stream workflows including Jobs API, Catalog Processing, Local Repository, Image Building, and Validation. 
## Test Structure ``` tests/ ├── integration/ # Integration tests for end-to-end workflows │ ├── api/ # API endpoint integration tests │ │ ├── jobs/ # Jobs API tests │ │ │ ├── conftest.py # Shared fixtures │ │ │ ├── test_create_job_api.py # POST /jobs tests │ │ │ ├── test_get_job_api.py # GET /jobs/{id} tests │ │ │ └── test_delete_job_api.py # DELETE /jobs/{id} tests │ │ ├── catalog_roles/ # Catalog processing tests │ │ │ ├── conftest.py # Shared fixtures │ │ │ ├── test_get_roles_api.py # GET /catalog_roles tests │ │ │ └── test_catalog_workflow.py # End-to-end catalog tests │ │ ├── parse_catalog/ # Catalog parsing tests │ │ │ ├── conftest.py # Shared fixtures │ │ │ └── test_parse_catalog_api.py # POST /parse_catalog tests │ │ ├── local_repo/ # Local repository tests │ │ │ ├── conftest.py # Shared fixtures │ │ │ ├── test_create_local_repo_api.py # POST /local_repo tests │ │ │ └── test_repo_workflow.py # End-to-end repo tests │ │ ├── build_image/ # Image building tests │ │ │ ├── conftest.py # Shared fixtures │ │ │ ├── test_build_image_api.py # POST /build_image tests │ │ │ └── test_multi_arch_build.py # Multi-architecture tests │ │ └── validate/ # Validation tests │ │ ├── conftest.py # Shared fixtures │ │ └── test_validate_api.py # POST /validate tests │ ├── core/ # Core domain integration tests │ │ ├── jobs/ # Job entity integration tests │ │ ├── catalog/ # Catalog entity integration tests │ │ └── localrepo/ # Repository entity integration tests │ └── infra/ # Infrastructure integration tests │ ├── repositories/ # Repository integration tests │ └── external/ # External service integration tests ├── unit/ # Unit tests for individual components │ ├── api/ # API layer unit tests │ │ ├── jobs/ # Jobs API unit tests │ │ │ ├── test_schemas.py # Pydantic schema tests │ │ │ ├── test_dependencies.py # Dependency injection tests │ │ │ └── test_routes.py # Route handler tests │ │ ├── catalog_roles/ # Catalog API unit tests │ │ ├── local_repo/ # Local repo API unit tests │ │ └── validate/ # Validation API unit tests │ ├── core/ # Core domain unit tests │ │ ├── jobs/ # Job entity and value object tests │ │ ├── catalog/ # Catalog entity tests │ │ ├── localrepo/ # Repository entity tests │ │ └── validate/ # Validation entity tests │ ├── orchestrator/ # Use case unit tests │ │ ├── jobs/ # Job use case tests │ │ ├── catalog/ # Catalog use case tests │ │ ├── local_repo/ # Repository use case tests │ │ └── validate/ # Validation use case tests │ └── infra/ # Infrastructure unit tests │ ├── repositories/ # Repository implementation tests │ ├── artifact_store/ # Artifact store tests │ └── db/ # Database layer tests ├── end_to_end/ # Complete workflow tests │ ├── test_full_job_workflow.py # Complete job lifecycle │ └── test_catalog_to_image.py # Catalog to image workflow ├── performance/ # Performance and load tests │ └── test_load.py # Load testing scenarios ├── fixtures/ # Shared test fixtures │ ├── job_fixtures.py # Job test data │ └── repo_fixtures.py # Repository test data ├── mocks/ # Mock objects and data │ ├── mock_vault.py # Vault mock │ └── mock_registry.py # Registry mock └── utils/ # Test utilities and helpers ├── assertions.py # Custom assertions └── helpers.py # Test helper functions ``` ## Prerequisites Install test dependencies: ```bash pip install -r requirements.txt ``` Required packages: - pytest>=7.4.0 - pytest-asyncio>=0.21.0 - httpx>=0.24.0 - pytest-cov>=4.1.0 ## Running Tests ### Run All Tests ```bash # Run all tests pytest tests/ -v # Run with coverage pytest tests/ --cov=api 
--cov=orchestrator --cov-report=html ``` ### Run Specific Test Suites ```bash # Integration tests only pytest tests/integration/ -v # Unit tests only pytest tests/unit/ -v # API tests only pytest tests/integration/api/ tests/unit/api/ -v ``` ### Run Specific Test Files ```bash # Jobs API tests pytest tests/integration/api/jobs/test_create_job_api.py -v # Catalog processing tests pytest tests/integration/api/catalog_roles/ -v # Local repository tests pytest tests/integration/api/local_repo/ -v # Image building tests pytest tests/integration/api/build_image/ -v # Validation tests pytest tests/integration/api/validate/ -v # Schema validation tests pytest tests/unit/api/jobs/test_schemas.py -v # Use case tests pytest tests/unit/orchestrator/ -v ``` ### Run Specific Test Classes or Functions ```bash # Run specific test class pytest tests/integration/api/jobs/test_create_job_api.py::TestCreateJobSuccess -v # Run specific test function pytest tests/integration/api/jobs/test_create_job_api.py::TestCreateJobSuccess::test_create_job_returns_201_with_valid_request -v # Run tests matching pattern pytest tests/integration/ -k idempotency -v ``` ## Test Types ### Unit Tests Test individual components in isolation: - **API Layer**: Route handlers, schemas, dependencies - **Core Layer**: Entities, value objects, domain services - **Orchestrator Layer**: Use cases and business logic - **Infrastructure Layer**: Repositories, external integrations ### Integration Tests Test component interactions: - **API Integration**: Full HTTP request/response cycles - **Database Integration**: Repository operations with real DB - **External Services**: Vault, Pulp, container registries - **Cross-Layer**: API → Use Case → Repository flows ### End-to-End Tests Test complete workflows from start to finish: - Full job creation and execution - Catalog parsing through role generation - Repository creation and package sync - Image building and registry push ### Performance Tests Test system performance and scalability: - Load testing for concurrent requests - Stress testing for resource limits - Benchmark tests for critical operations ## Workflow-Specific Tests ### Jobs Workflow Tests ```bash # All jobs tests pytest tests/integration/api/jobs/ tests/unit/orchestrator/jobs/ -v # Job creation and idempotency pytest tests/integration/api/jobs/test_create_job_api.py -v # Job lifecycle management pytest tests/integration/api/jobs/test_get_job_api.py -v ``` ### Catalog Workflow Tests ```bash # All catalog tests pytest tests/integration/api/catalog_roles/ tests/unit/core/catalog/ -v # Catalog parsing pytest tests/integration/api/parse_catalog/ -v # Role generation pytest tests/unit/orchestrator/catalog/ -v ``` ### Local Repository Workflow Tests ```bash # All local repo tests pytest tests/integration/api/local_repo/ tests/unit/core/localrepo/ -v # Repository creation pytest tests/integration/api/local_repo/test_create_local_repo.py -v ``` ### Image Building Workflow Tests ```bash # All build image tests pytest tests/integration/api/build_image/ tests/unit/core/build_image/ -v # Multi-architecture builds pytest tests/integration/api/build_image/ -k multi_arch -v ``` ### Validation Workflow Tests ```bash # All validation tests pytest tests/integration/api/validate/ tests/unit/core/validate/ -v # Schema validation pytest tests/unit/core/validate/ -k schema -v ``` ## Test Fixtures ### Shared Fixtures (conftest.py) **Authentication & Authorization:** - `client`: FastAPI TestClient with dev container - `auth_headers`: Standard 
authentication headers - `admin_auth_headers`: Admin-level authentication **Idempotency & Correlation:** - `unique_idempotency_key`: Unique key per test - `unique_correlation_id`: Unique correlation ID per test **Database & Storage:** - `db_session`: Database session for tests - `clean_db`: Fresh database for each test - `artifact_store`: Test artifact storage **Mock Services:** - `mock_vault_client`: Mocked Vault integration - `mock_pulp_client`: Mocked Pulp integration - `mock_registry_client`: Mocked container registry ### Usage Example ```python def test_create_job(client, auth_headers, unique_idempotency_key): """Test job creation with idempotency.""" payload = { "catalog_uri": "s3://bucket/catalog.json", "idempotency_key": unique_idempotency_key } response = client.post("/api/v1/jobs", json=payload, headers=auth_headers) assert response.status_code == 201 assert "job_id" in response.json() ``` ## Coverage Report Generate HTML coverage report: ```bash pytest tests/ --cov=api --cov=orchestrator --cov-report=html ``` View report: ```bash # Open htmlcov/index.html in browser ``` ## CI/CD Integration Add to GitHub Actions workflow: ```yaml - name: Run Tests run: | pip install -r requirements.txt pytest tests/ --cov=api --cov=orchestrator --cov-report=xml - name: Upload Coverage uses: codecov/codecov-action@v3 with: file: ./coverage.xml ``` ## Test Best Practices ### Test Design Principles 1. **Isolation**: Each test is independent and can run in any order - Use unique idempotency keys and correlation IDs - Clean up resources after each test - Avoid shared mutable state 2. **Fast Execution**: Tests should complete quickly - Unit tests: <100ms each - Integration tests: <5 seconds each - Use mocks for external dependencies 3. **Deterministic**: Tests produce consistent results - No flaky tests or race conditions - Avoid time-dependent logic - Use fixed test data 4. **Clear Naming**: Follow descriptive naming conventions - Pattern: `test___` - Example: `test_create_job_with_invalid_catalog_returns_400` 5. 
**Comprehensive Coverage**: Test all scenarios - Happy path (success cases) - Error cases (validation failures, exceptions) - Edge cases (boundary conditions) - Security (authentication, authorization) ### Test Organization **Arrange-Act-Assert Pattern:** ```python def test_example(): # Arrange: Set up test data and preconditions payload = {"catalog_uri": "s3://bucket/catalog.json"} # Act: Execute the operation being tested response = client.post("/api/v1/jobs", json=payload) # Assert: Verify the expected outcome assert response.status_code == 201 assert "job_id" in response.json() ``` **Test Grouping:** - Group related tests in classes - Use descriptive class names (e.g., `TestCreateJobSuccess`, `TestCreateJobValidation`) - Share setup/teardown logic within classes ### Security Testing **Authentication Tests:** - Test endpoints without authentication (should return 401) - Test with invalid tokens (should return 401) - Test with expired tokens (should return 401) **Authorization Tests:** - Test with insufficient permissions (should return 403) - Test role-based access control - Verify resource ownership checks **Input Validation:** - Test SQL injection attempts - Test XSS payloads - Test path traversal attempts - Test oversized inputs ### Mocking Guidelines **When to Mock:** - External HTTP APIs (Vault, Pulp, registries) - File system operations (for unit tests) - Time-dependent operations - Expensive computations **When NOT to Mock:** - Database operations (use test database) - Core business logic - Internal service calls - Simple utility functions ### Code Coverage Goals - **Overall**: >80% code coverage - **Core Domain**: >90% coverage - **API Routes**: >85% coverage - **Use Cases**: >90% coverage - **Critical Paths**: 100% coverage ## Troubleshooting ### Tests Fail with "Module not found" ```bash # Ensure you're in the correct directory cd build_stream/ # Run with Python path PYTHONPATH=. 
pytest tests/ ``` ### Tests Fail with Container Issues ```bash # Set ENV to dev export ENV=dev # Linux/Mac set ENV=dev # Windows CMD $env:ENV = "dev" # Windows PowerShell pytest tests/ ``` ### Slow Test Execution ```bash # Run tests in parallel pip install pytest-xdist pytest tests/ -n auto ``` ### Database Connection Issues ```bash # Ensure PostgreSQL is running # Check connection settings in environment variables # For Windows PowerShell $env:DATABASE_URL = "postgresql://user:password@localhost:5432/build_stream_test" # For Linux/Mac export DATABASE_URL="postgresql://user:password@localhost:5432/build_stream_test" # Run migrations alembic upgrade head # Run tests pytest tests/ ``` ### Authentication Failures ```bash # Verify Vault is accessible (if using real Vault) # Or ensure mock Vault is configured # Check JWT token configuration # Verify environment variables are set correctly ``` ## Environment Configuration ### Required Environment Variables For running tests, configure the following environment variables: **Windows PowerShell:** ```powershell $env:ENV = "dev" $env:HOST = "0.0.0.0" $env:PORT = "8000" $env:DATABASE_URL = "postgresql://user:password@localhost:5432/build_stream_test" $env:LOG_LEVEL = "DEBUG" ``` **Linux/Mac:** ```bash export ENV=dev export HOST=0.0.0.0 export PORT=8000 export DATABASE_URL=postgresql://user:password@localhost:5432/build_stream_test export LOG_LEVEL=DEBUG ``` ### Test Database Setup ```bash # Create test database createdb build_stream_test # Run migrations alembic upgrade head # Verify database psql build_stream_test -c "\dt" ``` ## Writing New Tests ### Adding a New Unit Test 1. Create test file in appropriate `tests/unit/` subdirectory 2. Import required modules and fixtures 3. Write test functions following naming conventions 4. Use mocks for external dependencies 5. Run tests to verify **Example:** ```python # tests/unit/core/jobs/test_job_entity.py import pytest from core.jobs.entities import Job from core.jobs.value_objects import JobId, StageName def test_job_creation_with_valid_data(): """Test job entity creation with valid data.""" job_id = JobId.generate() job = Job(job_id=job_id, client_id="test-client") assert job.job_id == job_id assert job.client_id == "test-client" assert job.status == "pending" ``` ### Adding a New Integration Test 1. Create test file in appropriate `tests/integration/` subdirectory 2. Use shared fixtures from conftest.py 3. Test full request/response cycles 4. Verify database state changes 5. 
Clean up test data **Example:** ```python # tests/integration/api/jobs/test_create_job_integration.py def test_create_job_integration(client, auth_headers, unique_idempotency_key): """Test complete job creation flow.""" payload = { "catalog_uri": "s3://test-bucket/catalog.json", "idempotency_key": unique_idempotency_key } response = client.post("/api/v1/jobs", json=payload, headers=auth_headers) assert response.status_code == 201 data = response.json() assert "job_id" in data assert data["status"] == "pending" ``` ## Continuous Integration ### GitHub Actions Example ```yaml name: Test Suite on: [push, pull_request] jobs: test: runs-on: ubuntu-latest services: postgres: image: postgres:15 env: POSTGRES_PASSWORD: postgres POSTGRES_DB: build_stream_test options: >- --health-cmd pg_isready --health-interval 10s --health-timeout 5s --health-retries 5 steps: - uses: actions/checkout@v3 - name: Set up Python uses: actions/setup-python@v4 with: python-version: '3.11' - name: Install dependencies run: | pip install -r requirements.txt pip install -r requirements-dev.txt - name: Run tests env: ENV: dev DATABASE_URL: postgresql://postgres:postgres@localhost:5432/build_stream_test run: | pytest tests/ -v --cov=api --cov=orchestrator --cov=core --cov-report=xml - name: Upload coverage uses: codecov/codecov-action@v3 with: file: ./coverage.xml ``` ## Additional Resources - [Main Build Stream README](../README.md) - Architecture and getting started - [Developer Guide](../doc/developer-guide.md) - Comprehensive development guide - [Workflow Documentation](../doc/) - Detailed workflow guides - [pytest Documentation](https://docs.pytest.org/) - pytest framework reference - [FastAPI Testing](https://fastapi.tiangolo.com/tutorial/testing/) - FastAPI testing guide ================================================ FILE: build_stream/tests/__init__.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. ================================================ FILE: build_stream/tests/conftest.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Shared pytest fixtures for Build Stream API tests. Note: This conftest is for mock-based unit/integration tests. E2E integration tests use tests/integration/conftest.py which does not import the app directly (it runs the server as a subprocess). 
""" # pylint: disable=redefined-outer-name,global-statement,import-outside-toplevel,protected-access import base64 import os import sys from pathlib import Path from typing import Dict, Generator import pytest # Set DATABASE_URL early for test environment os.environ.setdefault("DATABASE_URL", "sqlite:///:memory:") # Patch JWT exceptions for compatibility with newer PyJWT versions # This must be done before any imports of jwt.exceptions import jwt.exceptions if not hasattr(jwt.exceptions, 'DecodeError'): jwt.exceptions.DecodeError = jwt.exceptions.JWTDecodeError if not hasattr(jwt.exceptions, 'ExpiredSignatureError'): class ExpiredSignatureError(jwt.exceptions.JWTDecodeError): """Alias for expired signature errors.""" jwt.exceptions.ExpiredSignatureError = ExpiredSignatureError if not hasattr(jwt.exceptions, 'InvalidAudienceError'): class InvalidAudienceError(jwt.exceptions.JWTDecodeError): """Alias for invalid audience errors.""" jwt.exceptions.InvalidAudienceError = InvalidAudienceError if not hasattr(jwt.exceptions, 'InvalidIssuerError'): class InvalidIssuerError(jwt.exceptions.JWTDecodeError): """Alias for invalid issuer errors.""" jwt.exceptions.InvalidIssuerError = InvalidIssuerError if not hasattr(jwt.exceptions, 'InvalidSignatureError'): class InvalidSignatureError(jwt.exceptions.JWTDecodeError): """Alias for invalid signature errors.""" jwt.exceptions.InvalidSignatureError = InvalidSignatureError # Note: pythonpath is set in pytest.ini at project root # Lazy imports to avoid triggering FastAPI route registration # when running E2E tests that don't need these fixtures _APP = None _AUTH_SERVICE = None _AUTH_ROUTES = None _MOCK_VAULT_CLIENT = None def _get_app(): """Lazy import of FastAPI app.""" global _APP if _APP is None: from main import app # noqa: PLC0415 _APP = app return _APP def _get_auth_service(): """Lazy import of AuthService.""" global _AUTH_SERVICE if _AUTH_SERVICE is None: from api.auth.service import AuthService # noqa: PLC0415 _AUTH_SERVICE = AuthService return _AUTH_SERVICE def _get_auth_routes(): """Lazy import of auth routes.""" global _AUTH_ROUTES if _AUTH_ROUTES is None: from api.auth import routes as auth_routes # noqa: PLC0415 _AUTH_ROUTES = auth_routes return _AUTH_ROUTES def _get_mock_vault_client(): """Lazy import of MockVaultClient.""" global _MOCK_VAULT_CLIENT if _MOCK_VAULT_CLIENT is None: from tests.mocks.mock_vault_client import MockVaultClient # noqa: PLC0415 _MOCK_VAULT_CLIENT = MockVaultClient return _MOCK_VAULT_CLIENT _MOCK_JWT_HANDLER = None def _get_mock_jwt_handler(): """Lazy import of MockJWTHandler.""" global _MOCK_JWT_HANDLER if _MOCK_JWT_HANDLER is None: from tests.mocks.mock_jwt_handler import MockJWTHandler # noqa: PLC0415 _MOCK_JWT_HANDLER = MockJWTHandler return _MOCK_JWT_HANDLER @pytest.fixture def mock_vault_client(): """Create a fresh MockVaultClient instance. Returns: MockVaultClient with default test credentials. """ mock_vault_client = _get_mock_vault_client() return mock_vault_client() @pytest.fixture def mock_vault_with_client(mock_vault_client): # noqa: W0621 """Create a MockVaultClient with an existing registered client. Args: mock_vault_client: Base mock vault client. Returns: MockVaultClient with one pre-registered client. """ mock_vault_client.add_test_client() return mock_vault_client @pytest.fixture def auth_service(mock_vault_client): # noqa: W0621 """Create an AuthService with mock vault client. Args: mock_vault_client: Mock vault client fixture. Returns: AuthService configured with mock vault. 
""" auth_service_class = _get_auth_service() return auth_service_class(vault_client=mock_vault_client) @pytest.fixture def mock_jwt_handler(): """Create a fresh MockJWTHandler instance. Returns: MockJWTHandler for testing JWT operations. """ mock_jwt_handler = _get_mock_jwt_handler() return mock_jwt_handler() @pytest.fixture def test_client(mock_vault_client, mock_jwt_handler) -> Generator: # noqa: W0621 """Create a FastAPI TestClient with mocked dependencies. Args: mock_vault_client: Mock vault client fixture. mock_jwt_handler: Mock JWT handler fixture. Yields: TestClient configured for testing. """ from fastapi.testclient import TestClient # noqa: PLC0415 from api.auth.routes import get_auth_service # noqa: PLC0415 app = _get_app() auth_service_class = _get_auth_service() test_auth_service = auth_service_class( vault_client=mock_vault_client, jwt_handler=mock_jwt_handler, ) # Override the dependency injection app.dependency_overrides[get_auth_service] = lambda: test_auth_service with TestClient(app) as client: yield client # Clean up dependency overrides app.dependency_overrides.clear() @pytest.fixture def test_client_with_existing_client( # noqa: C0301,W0621 mock_vault_with_client, mock_jwt_handler ) -> Generator: """Create a TestClient with a pre-registered client in vault. Args: mock_vault_with_client: Mock vault with existing client. mock_jwt_handler: Mock JWT handler fixture. Yields: TestClient configured for testing max client scenarios. """ from fastapi.testclient import TestClient # noqa: PLC0415 from api.auth.routes import get_auth_service # noqa: PLC0415 app = _get_app() auth_service_class = _get_auth_service() test_auth_service = auth_service_class( vault_client=mock_vault_with_client, jwt_handler=mock_jwt_handler, ) # Override the dependency injection app.dependency_overrides[get_auth_service] = lambda: test_auth_service with TestClient(app) as client: yield client # Clean up dependency overrides app.dependency_overrides.clear() @pytest.fixture def valid_auth_header() -> Dict[str, str]: """Create valid Basic Auth header for registration endpoint. Returns: Dictionary with Authorization header. """ mock_vault_client_class = _get_mock_vault_client() username = mock_vault_client_class.DEFAULT_TEST_USERNAME password = mock_vault_client_class.DEFAULT_TEST_PASSWORD credentials = base64.b64encode( f"{username}:{password}".encode() ).decode() return {"Authorization": f"Basic {credentials}"} @pytest.fixture def invalid_auth_header() -> Dict[str, str]: """Create invalid Basic Auth header. Returns: Dictionary with invalid Authorization header. """ credentials = base64.b64encode(b"wrong_user:wrong_password").decode() return {"Authorization": f"Basic {credentials}"} @pytest.fixture def valid_registration_request() -> Dict: """Create a valid client registration request body. Returns: Dictionary with valid registration data. """ return { "client_name": "test-client-01", "description": "Test client for unit tests", "allowed_scopes": ["catalog:read", "catalog:write"], } @pytest.fixture def minimal_registration_request() -> Dict: """Create a minimal valid registration request (only required fields). Returns: Dictionary with minimal registration data. """ return { "client_name": "minimal-client", } @pytest.fixture def valid_token_request() -> Dict: """Create a valid token request body template. Note: client_id and client_secret must be filled in after registration. Returns: Dictionary with token request template. 
""" return { "grant_type": "client_credentials", "client_id": None, "client_secret": None, } def generate_test_client_secret() -> str: """Generate a test client secret that is different from the valid one. Returns: Invalid client secret string for testing (valid format, wrong value). """ return "bld_s_invalid_test_secret_12345" def generate_invalid_client_id() -> str: """Generate an invalid client ID for testing. Returns: Invalid client ID string (contains invalid characters). """ return "invalid@client#id" def generate_invalid_client_secret() -> str: """Generate an invalid client secret for testing. Returns: Invalid client secret string (too short). """ return "short" ================================================ FILE: build_stream/tests/demo/buildstream_demo.py ================================================ #!/usr/bin/env python3 # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """Complete Parse-Catalog Demo with Real API Calls. This script demonstrates the full parse-catalog workflow by: 1. Making actual API calls using requests 2. Using the real catalog_rhel.json file 3. Showing all responses and generated artifacts 4. Interactive step-by-step execution with user confirmation Usage: python buildstream_demo.py # Register new client python buildstream_demo.py --cleanup # Clean artifacts and register new client python buildstream_demo.py --help # Show options Note: Update the Configuration constants in code as per your configuration """ import argparse import base64 import json import shutil import subprocess import time import uuid from pathlib import Path import urllib3 import requests # Disable SSL warnings urllib3.disable_warnings(urllib3.exceptions.InsecureRequestWarning) # Configuration constants BASE_URL = "https://182.10.5.157:8010" CLIENT_NAME = "demo-client" AUTH_USERNAME = "admin" AUTH_PASSWORD = "" CREDENTIALS_FILE = Path(__file__).parent / "demo_client_credentials.json" BUILD_STREAM_ARTIFACT_ROOT = "/opt/omnia/build_stream/artifacts" CATALOG_FILE = Path("/opt/omnia/windsurf/working_dir/demo/catalog_rhel.json") class ParseCatalogDemo: """Complete demo class for parse-catalog functionality.""" def __init__(self, cleanup=False): self.base_url = BASE_URL # Client configuration self.client_name = CLIENT_NAME # Build Stream artifact root self.build_stream_artifact_root = BUILD_STREAM_ARTIFACT_ROOT # Authentication credentials for build_stream registration # These are the credentials used to register new OAuth clients self.auth_username = AUTH_USERNAME self.auth_password = AUTH_PASSWORD # Creates this file if it doesn't exist, for future use, # if exists it uses the client_id and client_secret from it self.credentials_file = CREDENTIALS_FILE self.catalog_file = CATALOG_FILE # Load existing credentials or set to None self.client_id = None self.client_secret = None self.load_credentials() self.access_token = None self.job_id = None self.correlation_id = str(uuid.uuid4()) self.cleanup = cleanup def wait_for_enter(self, 
message="Press ENTER to continue..."): """Wait for user to press enter.""" input(f"\n⏸️ {message}") def load_credentials(self): """Load client credentials from file if exists.""" if self.credentials_file.exists(): try: with open(self.credentials_file, 'r', encoding='utf-8') as f: credentials = json.load(f) client_id = credentials.get('client_id') client_secret = credentials.get('client_secret') # Only update if values are not empty if client_id: self.client_id = client_id if client_secret: self.client_secret = client_secret print(f"📁 Loaded existing credentials from {self.credentials_file}") return True except (json.JSONDecodeError, IOError) as e: print(f"⚠️ Error loading credentials: {e}") return False return False def save_credentials(self, client_id, client_secret): """Save client credentials to file.""" try: credentials = { 'client_id': client_id, 'client_secret': client_secret, 'created_at': time.strftime('%Y-%m-%d %H:%M:%S') } with open(self.credentials_file, 'w', encoding='utf-8') as f: json.dump(credentials, f, indent=2) print(f"💾 Saved credentials to {self.credentials_file}") return True except (json.JSONDecodeError, IOError) as e: print(f"⚠️ Error saving credentials: {e}") return False def cleanup_artifacts(self): """Delete all contents inside build_stream_artifact_root.""" print("\n" + "="*60) print("🧹 CLEANUP: Removing Existing Artifacts") print("="*60) artifacts_path = Path(self.build_stream_artifact_root) if not artifacts_path.exists(): print(f"📂 Artifacts directory does not exist: {artifacts_path}") print("✅ Nothing to clean up") return print(f"� Artifacts Directory: {artifacts_path}") print("⚠️ This will delete all contents inside the artifacts directory") self.wait_for_enter("Press ENTER to proceed with cleanup...") try: # Delete all contents inside the directory deleted_count = 0 for item in artifacts_path.iterdir(): if item.is_dir(): print(f"🗑️ Removing directory: {item.name}/") shutil.rmtree(item) deleted_count += 1 else: print(f"🗑️ Removing file: {item.name}") item.unlink() deleted_count += 1 print(f"\n✅ Cleanup completed: {deleted_count} items removed") except (OSError, shutil.Error) as e: print(f"\n❌ Cleanup failed: {e}") print("⚠️ Continuing with demo...") def check_server_health(self): """Check if the server is running.""" print("\n" + "="*60) print("🏥 STEP 0: Health Check") print("="*60) print(f"📡 Endpoint: GET {self.base_url}/health") self.wait_for_enter("Press ENTER to check server health...") try: response = requests.get(f"{self.base_url}/health", timeout=5, verify=False) print(f"\n✅ Response Status: {response.status_code}") print(f"📝 Response Body: {json.dumps(response.json(), indent=2)}") return response.status_code == 200 except requests.exceptions.ConnectionError: print(f"\n❌ Server not running at {self.base_url}") print(" Start server with: uvicorn main:app --host 0.0.0.0 --port 8010") return False except (requests.exceptions.RequestException, ValueError) as e: print(f"\n❌ Error: {e}") return False def register_client(self): """Register OAuth client or use existing one.""" print("\n" + "="*60) print("📝 STEP 1: Register OAuth Client") print("="*60) # If we already have credentials, skip registration if self.client_secret: print("✅ Using provided credentials!") print(f" Client ID: {self.client_id}") print(f" Client Secret: {self.client_secret}") print("\n💡 Skipping registration - using existing credentials") return True # Authentication credentials for build_stream registration # These are the credentials used to register new OAuth clients # The vault shows: 
username="build_stream_register" with password_hash for "dell1234" # But the actual system might be using different credentials print(f"🔐 Using auth credentials: {self.auth_username}:" f"{self.auth_password}") auth_header = base64.b64encode(f"{self.auth_username}:{self.auth_password}".encode()).decode() client_data = { "client_id": self.client_id, "client_name": self.client_name, "allowed_scopes": ["catalog:read", "catalog:write","job:write"], "grant_types": ["client_credentials"] } print(f"📡 Endpoint: POST {self.base_url}/api/v1/auth/register") print("📝 Headers:") print(" Content-Type: application/json") print(f" Authorization: Basic {auth_header}") print("📝 Request Body:") print(json.dumps(client_data, indent=2)) self.wait_for_enter("Press ENTER to register client...") try: response = requests.post( f"{self.base_url}/api/v1/auth/register", json=client_data, headers={ "Content-Type": "application/json", "Authorization": f"Basic {auth_header}" }, timeout=30, verify=False ) print(f"\n✅ Response Status: {response.status_code}") if response.status_code in [200, 201]: client_info = response.json() print("📋 Response Body:") # Mask the secret for display display_info = client_info.copy() if 'client_secret' in display_info: display_info['client_secret'] = display_info['client_secret'][:8] + "..." + display_info['client_secret'][-4:] print(json.dumps(display_info, indent=2)) self.client_secret = client_info.get('client_secret') self.client_id = client_info.get('client_id') # Use server-assigned ID print("\n✅ Client registered successfully!") print(f" Client ID: {self.client_id}") print(f" Client Secret: {self.client_secret}") # Save credentials to file for future use self.save_credentials(self.client_id, self.client_secret) print(f"\n💡 Credentials saved to {self.credentials_file}") print("💡 Next run will automatically use these credentials!") return True elif response.status_code == 409: # Client already exists, try to use existing one print("📋 Response Body:") print(response.text) print("\n⚠️ Client registration failed (max clients reached)") print("💡 Attempting to use existing client...") # Try to get token with a known existing client existing_client_id = "bld_daa6c90eff86b1036c9f922a098562e5" existing_client_secret = "bld_s_bUrHRr663yUldYraSQ1sDEWyR7x2x_6gPrVomUpnFtw" # Test if existing client works token_data = { "grant_type": "client_credentials", "client_id": existing_client_id, "client_secret": existing_client_secret } token_response = requests.post( f"{self.base_url}/api/v1/auth/token", data=token_data, headers={"Content-Type": "application/x-www-form-urlencoded"}, timeout=30, verify=False ) if token_response.status_code == 200: self.client_id = existing_client_id self.client_secret = existing_client_secret print("✅ Using existing client!") print(f" Client ID: {self.client_id}") print(f" Client Secret: {self.client_secret}") print("\n💡 These credentials are working for this session") return True else: print("❌ Existing client also failed") return False else: print("📋 Response Body:") print(response.text) print("\n❌ Registration failed") return False except Exception as e: print(f"\n❌ Error: {e}") return False def get_access_token(self): """Get JWT access token.""" print("\n" + "="*60) print("🔑 STEP 2: Get Access Token") print("="*60) token_data = { "grant_type": "client_credentials", "client_id": self.client_id, "client_secret": self.client_secret } print(f"📡 Endpoint: POST {self.base_url}/api/v1/auth/token") print("📋 Headers:") print(" Content-Type: application/x-www-form-urlencoded") 
print("📋 Request Body:") print(" grant_type=client_credentials") print(f" client_id={self.client_id}") print(f" client_secret={self.client_secret[:8]}...{self.client_secret[-4:]}") self.wait_for_enter("Press ENTER to get access token...") try: response = requests.post( f"{self.base_url}/api/v1/auth/token", data=token_data, headers={"Content-Type": "application/x-www-form-urlencoded"}, timeout=30, verify=False ) print(f"\n✅ Response Status: {response.status_code}") if response.status_code in [200, 201]: token_info = response.json() self.access_token = token_info.get("access_token") # Mask token for display display_info = token_info.copy() if 'access_token' in display_info: display_info['access_token'] = display_info['access_token'][:20] + "..." + display_info['access_token'][-10:] print("📋 Response Body:") print(json.dumps(display_info, indent=2)) print("\n✅ Access token obtained!") return True else: print("📋 Response Body:") print(response.text) print("\n❌ Token request failed") # Check if this is an authentication error (401/403) if response.status_code in [401, 403]: print("\n🔄 The access token request failed with authentication error.") print("💡 This might be due to expired or invalid client credentials.") return "retry_register" return False except Exception as e: print(f"\n❌ Error: {e}") return False def create_job(self): """Create a job for parse-catalog.""" print("\n" + "="*60) print("🧾 STEP 3: Create Job") print("="*60) job_data = { "correlation_id": self.correlation_id, "client_id": self.client_id } idempotency_key = str(uuid.uuid4()) print(f"📡 Endpoint: POST {self.base_url}/api/v1/jobs") print("📋 Headers:") print(" Content-Type: application/json") print(f" Authorization: Bearer {self.access_token[:20]}...{self.access_token[-10:]}") print(f" Idempotency-Key: {idempotency_key}") print("📋 Request Body:") print(json.dumps(job_data, indent=2)) self.wait_for_enter("Press ENTER to create job...") try: response = requests.post( f"{self.base_url}/api/v1/jobs", json=job_data, headers={ "Content-Type": "application/json", "Authorization": f"Bearer {self.access_token}", "Idempotency-Key": idempotency_key }, timeout=30, verify=False ) print(f"\n✅ Response Status: {response.status_code}") if response.status_code in [200, 201]: job_info = response.json() self.job_id = job_info.get("job_id") print("📋 Response Body:") print(json.dumps(job_info, indent=2)) print(f"\n✅ Job created: {self.job_id}") return True else: print("📋 Response Body:") print(response.text) print("\n❌ Job creation failed") return False except Exception as e: print(f"\n❌ Error: {e}") return False def get_job_info(self): """Get job information using GET /api/v1/jobs/{job_id}.""" print("\n" + "="*60) print("📋 Job Status Check") print("="*60) print(f"📡 Endpoint: GET {self.base_url}/api/v1/jobs/{self.job_id}") print("📋 Headers:") print(f" Authorization: Bearer {self.access_token[:20]}...{self.access_token[-10:]}") try: response = requests.get( f"{self.base_url}/api/v1/jobs/{self.job_id}", headers={"Authorization": f"Bearer {self.access_token}"}, timeout=30, verify=False ) print(f"\n✅ Response Status: {response.status_code}") if response.status_code == 200: job_info = response.json() print("📋 Response Body:") print(json.dumps(job_info, indent=2)) # Show stage summary stages = job_info.get("stages", []) print("\n📊 Stage Summary:") for stage in stages: status_emoji = "✅" if stage.get("stage_state") == "COMPLETED" else "⏳" if stage.get("stage_state") == "PENDING" else "❌" status_emoji = ( "✅" if stage.get("stage_state") == "COMPLETED" 
else "⏳" if stage.get("stage_state") == "PENDING" else "❌" ) return job_info else: print("📋 Response Body:") print(response.text) print("\n❌ Failed to get job info") return None except Exception as e: print(f"\n❌ Error: {e}") return None def parse_catalog(self): """Parse the catalog file.""" print("\n" + "="*60) print("📝 STEP 4: Parse Catalog") print("="*60) # Use the configured catalog file catalog_file = self.catalog_file if not catalog_file.exists(): print(f"❌ Catalog file not found: {catalog_file}") return False print(f"📠Catalog File: {catalog_file}") print(f"📊 File Size: {catalog_file.stat().st_size:,} bytes") print(f"\n📡 Endpoint: POST {self.base_url}/api/v1/jobs/{self.job_id}/stages/parse-catalog") print("📋 Headers:") print(f" Authorization: Bearer {self.access_token[:20]}...{self.access_token[-10:]}") print("📋 Files:") print(f" file=@{catalog_file.name}") self.wait_for_enter("Press ENTER to parse catalog...") try: with open(catalog_file, 'rb') as f: files = {'file': (catalog_file.name, f, 'application/json')} response = requests.post( f"{self.base_url}/api/v1/jobs/{self.job_id}/stages/parse-catalog", files=files, headers={"Authorization": f"Bearer {self.access_token}"}, timeout=60, # Longer timeout for file upload verify=False ) print(f"\n✅ Response Status: {response.status_code}") if response.status_code in [200, 201]: result = response.json() print("📋 Response Body:") print(json.dumps(result, indent=2)) print("\n✅ Parse catalog successful!") # Get job info after parse catalog self.get_job_info() return True else: print("📋 Response Body:") print(response.text) print("\n❌ Parse catalog failed!") return False except Exception as exc: print(f"\n❌ Error: {exc}") return False def generate_input_files(self): """Generate input files using the parsed catalog.""" print("\n" + "="*60) print("⚙️ STEP 5: Generate Input Files") print("="*60) print(f"\n📡 Endpoint: POST {self.base_url}/api/v1/jobs/{self.job_id}/stages/generate-input-files") print("📋 Headers:") print(f" Authorization: Bearer {self.access_token[:20]}...{self.access_token[-10:]}") print("📋 Request Body: (empty, uses default adapter policy)") self.wait_for_enter("Press ENTER to generate input files...") try: response = requests.post( f"{self.base_url}/api/v1/jobs/{self.job_id}/stages/generate-input-files", headers={"Authorization": f"Bearer {self.access_token}"}, timeout=30, verify=False ) print(f"\n✅ Response Status: {response.status_code}") if response.status_code in [200, 201]: result = response.json() print("📋 Response Body:") print(json.dumps(result, indent=2)) print("\n✅ Generate input files successful!") # Get job info after generate input files self.get_job_info() return True else: print("📋 Response Body:") print(response.text) print("\n❌ Generate input files failed") return False except Exception as e: print(f"\n❌ Error: {e}") return False def show_artifacts(self): """Show generated artifacts using tree command.""" print("\n" + "="*60) print("📦 STEP 6: View Generated Artifacts") print("="*60) catalog_artifact_path = Path(self.build_stream_artifact_root) / "catalog" input_files_artifact_path = Path(self.build_stream_artifact_root) / "input-files" job_id_artifact_path = Path(self.build_stream_artifact_root) / self.job_id print(f"📂 Catalog artifacts: {catalog_artifact_path}") print(f"📂 Input files artifacts: {input_files_artifact_path}") print(f"📂 Job ID artifacts: {job_id_artifact_path}") self.wait_for_enter("Press ENTER to view artifacts...") # Show catalog artifacts if catalog_artifact_path.exists(): print("\n📦 Catalog 
Artifacts:") try: result = subprocess.run( ["tree", "-L", "2", "-h", str(catalog_artifact_path)], capture_output=True, text=True, check=True ) if result.returncode == 0: print(result.stdout) else: self._fallback_artifact_list(catalog_artifact_path) except: self._fallback_artifact_list(catalog_artifact_path) else: print("\n❌ No catalog artifacts directory found") # Show input files artifacts if input_files_artifact_path.exists(): print("\n📦 Input Files Artifacts:") try: result = subprocess.run( ["tree", "-L", "2", "-h", str(input_files_artifact_path)], capture_output=True, text=True, check=True ) if result.returncode == 0: print(result.stdout) else: self._fallback_artifact_list(input_files_artifact_path) except: self._fallback_artifact_list(input_files_artifact_path) else: print("\n❌ No input files artifacts directory found") # Show job ID artifacts if job_id_artifact_path.exists(): print("\n📦 Job ID Artifacts:") try: result = subprocess.run( ["tree", str(job_id_artifact_path)], capture_output=True, text=True ) if result.returncode == 0: print(result.stdout) else: self._fallback_artifact_list(job_id_artifact_path) except: self._fallback_artifact_list(job_id_artifact_path) else: print(f"\n❌ Job ID artifacts directory not found: {job_id_artifact_path}") # Show content preview of the most recent artifacts self._show_latest_artifacts_preview(catalog_artifact_path, input_files_artifact_path) def _fallback_artifact_list(self, artifact_path): """Fallback method to list artifacts when tree command is not available.""" artifacts = sorted(artifact_path.iterdir(), key=lambda x: x.stat().st_mtime, reverse=True) for artifact_dir in artifacts: if artifact_dir.is_dir(): print(f"\n📦 {artifact_dir.name}/") for f in artifact_dir.iterdir(): size = f.stat().st_size print(f" 📝 {f.name} ({size:,} bytes)") def _show_latest_artifacts_preview(self, catalog_path, input_files_path): """Show content preview of the most recent artifacts.""" # Show latest catalog artifact if catalog_path.exists(): catalog_artifacts = sorted(catalog_path.iterdir(), key=lambda x: x.stat().st_mtime, reverse=True) if catalog_artifacts: latest_catalog = catalog_artifacts[0] print(f"\n📋 Latest Catalog Artifact: {latest_catalog.name}") for f in latest_catalog.iterdir(): if f.name.endswith('.bin'): print(f"\n📝 Content preview of {f.name}:") try: content = f.read_text()[:300] print(content) if len(f.read_text()) > 300: print("...") except: print(" [binary data]") elif f.name.endswith('.zip'): print(f"\n📦 Archive contents of {f.name}:") try: result = subprocess.run( ["unzip", "-l", str(f)], capture_output=True, text=True ) if result.returncode == 0: print(result.stdout) except: print(" [unable to list archive contents]") # Show latest input files artifact if input_files_path.exists(): input_artifacts = sorted(input_files_path.iterdir(), key=lambda x: x.stat().st_mtime, reverse=True) if input_artifacts: latest_input = input_artifacts[0] print(f"\n📋 Latest Input Files Artifact: {latest_input.name}") for f in latest_input.iterdir(): if f.name.endswith('.zip'): print(f"\n📦 Archive contents of {f.name}:") try: result = subprocess.run( ["unzip", "-l", str(f)], capture_output=True, text=True ) if result.returncode == 0: print(result.stdout) except: print(" [unable to list archive contents]") def create_local_repository(self): """Create local repository using the generated input files.""" print("\n" + "="*60) print("🏗️ STEP 7: Create Local Repository") print("="*60) print(f"\n📡 Endpoint: POST 
{self.base_url}/api/v1/jobs/{self.job_id}/stages/create-local-repository") print("📋 Headers:") print(f" Authorization: Bearer {self.access_token[:20]}...{self.access_token[-10:]}") print("📋 Request Body: (empty, uses job context from previous stages)") self.wait_for_enter("Press ENTER to create local repository...") try: response = requests.post( f"{self.base_url}/api/v1/jobs/{self.job_id}/stages/create-local-repository", headers={"Authorization": f"Bearer {self.access_token}"}, timeout=30, verify=False ) print(f"\n✅ Response Status: {response.status_code}") if response.status_code in [200, 201, 202]: result = response.json() print("📋 Response Body:") print(json.dumps(result, indent=2)) print("\n✅ Create local repository successful!") # Get job info after create local repository self.get_job_info() return True else: print("📋 Response Body:") print(response.text) print("\n❌ Create local repository failed") return False except Exception as e: print(f"\n❌ Error: {e}") return False def _trigger_build_image_stage(self, step_label: str, architecture: str, functional_groups, inventory_host: str | None): print("\n" + "="*60) print(step_label) print("="*60) if not self.job_id: print("❌ No job_id available. Create a job before triggering this stage.") return False payload = { "architecture": architecture, "image_key": "demo-build-image", "functional_groups": functional_groups, } if inventory_host: payload["inventory_host"] = inventory_host print(f"📍 Endpoint: POST {self.base_url}/api/v1/jobs/{self.job_id}/stages/build-image") print("📋 Headers:") print(f" Authorization: Bearer {self.access_token[:20]}...{self.access_token[-10:]}") print("📋 Request Body:") print(json.dumps(payload, indent=2)) self.wait_for_enter("Press ENTER to trigger build-image stage...") try: response = requests.post( f"{self.base_url}/api/v1/jobs/{self.job_id}/stages/build-image", json=payload, headers={"Authorization": f"Bearer {self.access_token}"}, timeout=60, # Longer timeout for build operations verify=False, ) print(f"\n✅ Response Status: {response.status_code}") if response.status_code in (200, 202): print("📋 Response Body:") print(json.dumps(response.json(), indent=2)) print("\n✅ Build image stage triggered!") return True print("📋 Response Body:") print(response.text) print("\n❌ Failed to trigger build image stage") return False except Exception as exc: print(f"\n❌ Error: {exc}") return False def trigger_build_image_x86_64_stage(self): """Trigger build image stage for x86_64 architecture.""" groups = [ "service_kube_control_plane_first_x86_64", "service_kube_control_plane_x86_64", "service_kube_node_x86_64", "slurm_control_node_x86_64", "slurm_node_x86_64", "login_node_x86_64", "login_compiler_node_x86_64", ] return self._trigger_build_image_stage( "🛠️ STEP 8A: Trigger Build Image Stage (x86_64)", "x86_64", groups, inventory_host=None, ) def trigger_build_image_aarch64_stage(self): """Trigger build image stage for aarch64 architecture.""" groups = [ "slurm_node_aarch64", "login_node_aarch64", "login_compiler_node_aarch64", ] return self._trigger_build_image_stage( "🛠️ STEP 8B: Trigger Build Image Stage (aarch64)", "aarch64", groups, inventory_host="182.10.0.170", ) def run_demo(self): """Run the complete demo.""" print("\n" + "="*60) print("🚀 Parse-Catalog Interactive Demo") print("="*60) print("📋 This demo will execute the complete parse-catalog workflow") print("📋 using the real catalog_rhel.json file") print(" Press ENTER at each step to proceed") print("="*60) print(f"\n🔑 Demo Client ID: {self.client_id}") print(f"🔑 
Correlation ID: {self.correlation_id}") try: # Cleanup artifacts if requested if self.cleanup: self.cleanup_artifacts() # Step 0: Health check if not self.check_server_health(): return # Step 1: Register client (with retry loop) while True: # Step 1: Register client if not self.register_client(): return # Step 2: Get access token token_result = self.get_access_token() if token_result == True: # Success, break the retry loop break elif token_result == "retry_register": # Ask user if they want to try registering again while True: user_input = input("\n❓ Do you want to try to register again? (yes/no): ").strip().lower() if user_input in ['yes', 'y', 'no', 'n']: break print(" Please enter 'yes' or 'no'") if user_input in ['yes', 'y']: print("\n🔄 Attempting to register new client...") # Clear existing credentials and continue the loop to retry self.client_id = None self.client_secret = None continue else: print("\n⚠️ Continuing without valid credentials - demo cannot proceed.") return else: # Other failure, exit return # Step 3: Create job if not self.create_job(): return # Step 4: Parse catalog if not self.parse_catalog(): return # Step 5: Generate input files if not self.generate_input_files(): return # Step 6: Show artifacts self.show_artifacts() # Step 7: Create local repository if not self.create_local_repository(): return # Step 8A: x86_64 build-image stage if not self.trigger_build_image_x86_64_stage(): return # Step 8B: aarch64 build-image stage if not self.trigger_build_image_aarch64_stage(): return print("\n" + "="*60) print("✅ Demo Completed Successfully!") print("="*60) print(f"📊 Client ID: {self.client_id}") print(f"📊 Job ID: {self.job_id}") print(f"📊 Correlation ID: {self.correlation_id}") print(f"📦 Catalog Artifacts: {Path(self.build_stream_artifact_root) / 'catalog'}/") print(f"📦 Input Files Artifacts: {Path(self.build_stream_artifact_root) / 'input-files'}/") print("📦 Local Repository: Created via Ansible playbook") print("📦 Build Image Stage: Submitted for both x86_64 and aarch64") print("="*60) except KeyboardInterrupt: print("\n\n⚠️ Demo interrupted by user") except Exception as e: print(f"\n\n❌ Demo failed: {e}") def main(): """Main entry point with argument parsing.""" parser = argparse.ArgumentParser( description="Parse-Catalog Interactive Demo", formatter_class=argparse.RawDescriptionHelpFormatter, epilog=""" Examples: # Register a new client python buildstream_demo.py # Clean artifacts and register new client python buildstream_demo.py --cleanup """ ) parser.add_argument( "--cleanup", action="store_true", help="Delete all contents in /opt/omnia/build_stream/artifacts before starting demo" ) args = parser.parse_args() # Create and run demo demo = ParseCatalogDemo(cleanup=args.cleanup) demo.run_demo() if __name__ == "__main__": main() ================================================ FILE: build_stream/tests/end_to_end/api/conftest.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 
# See the License for the specific language governing permissions and # limitations under the License. """Pytest fixtures for integration tests with real Ansible Vault.""" # pylint: disable=redefined-outer-name,consider-using-with import base64 import logging import os import secrets import shutil import signal import socket import string import subprocess import tempfile import time from pathlib import Path from typing import Dict, Generator, Optional import httpx import pytest import yaml from argon2 import PasswordHasher, Type # noqa: E0611 pylint: disable=no-name-in-module # Configure logging for integration tests logging.basicConfig( level=logging.INFO, format="%(asctime)s - %(name)s - %(levelname)s - %(message)s", ) logger = logging.getLogger("integration_tests") def generate_secure_test_password(length: int = 24) -> str: """Generate a secure password for integration tests. Args: length: Length of the password (default: 24 for extra security) Returns: Secure random password """ # Use stronger character set for integration tests lowercase = string.ascii_lowercase uppercase = string.ascii_uppercase digits = string.digits special = "!@#$%^&*()_+-=[]{}|;:,.<>?" # Ensure minimum security requirements if length < 16: raise ValueError("Password length must be at least 16 characters") # Start with one of each required character type password = [ secrets.choice(lowercase), secrets.choice(uppercase), secrets.choice(digits), secrets.choice(special), ] # Fill remaining length all_chars = lowercase + uppercase + digits + special for _ in range(length - 4): password.append(secrets.choice(all_chars)) # Shuffle to avoid predictable pattern secrets.SystemRandom().shuffle(password) return ''.join(password) def generate_test_client_secret(length: int = 32) -> str: """Generate a test client secret with proper bld_s_ prefix. Args: length: Total length of the secret including prefix (default: 32) Returns: Test client secret with bld_s_ prefix """ if length < 8: raise ValueError("Client secret length must be at least 8 characters") # Generate random part (subtract 6 for "bld_s_" prefix) random_part_length = max(8, length - 6) random_part = generate_secure_test_password(random_part_length) return f"bld_s_{random_part}" def generate_invalid_client_id() -> str: """Generate an invalid client ID for testing (missing bld_ prefix). Returns: Invalid client ID without proper prefix """ return ( "invalid_client_id_" + ''.join(secrets.choice(string.ascii_lowercase + string.digits) for _ in range(8)) ) def generate_invalid_client_secret() -> str: """Generate an invalid client secret for testing (missing bld_s_ prefix). Returns: Invalid client secret without proper prefix """ return ( "invalid_secret_" + ''.join(secrets.choice(string.ascii_lowercase + string.digits) for _ in range(8)) ) class IntegrationTestConfig: """Configuration for integration tests.""" # Username is not a secret AUTH_USERNAME = "build_stream_registrar" SERVER_HOST = "127.0.0.1" SERVER_PORT = 18443 # Use different port to avoid conflicts SERVER_STARTUP_TIMEOUT = 30 @classmethod def get_vault_password(cls) -> str: """Get a dynamically generated vault password. Returns: Secure random vault password """ return generate_secure_test_password(24) @classmethod def get_auth_password(cls) -> str: """Get a dynamically generated auth password. 
Returns: Secure random auth password """ return generate_secure_test_password(24) class VaultManager: # noqa: R0902 pylint: disable=too-many-instance-attributes """Manages Ansible Vault setup and teardown for integration tests.""" def __init__(self, base_dir: str): """Initialize vault manager. Args: base_dir: Base directory for test vault files. """ self.base_dir = Path(base_dir) self.vault_dir = self.base_dir / "vault" self.vault_file = self.vault_dir / "build_stream_oauth_credentials.yml" self.vault_pass_file = self.base_dir / ".vault_pass" self.keys_dir = self.base_dir / "keys" self.private_key_file = self.keys_dir / "jwt_private.pem" self.public_key_file = self.keys_dir / "jwt_public.pem" self._hasher = PasswordHasher( time_cost=3, memory_cost=65536, parallelism=4, hash_len=32, salt_len=16, type=Type.ID, ) def setup(self, username: str, password: str) -> None: """Set up vault with initial credentials. Args: username: Registration username. password: Registration password. """ logger.info("Setting up Ansible Vault...") logger.info(" Vault directory: %s", self.vault_dir) logger.info(" Vault file: %s", self.vault_file) logger.info(" Vault password file: %s", self.vault_pass_file) self.vault_dir.mkdir(parents=True, exist_ok=True) logger.info(" Created vault directory") self.vault_pass_file.write_text(IntegrationTestConfig.get_vault_password()) self.vault_pass_file.chmod(0o600) logger.info(" Created vault password file") logger.info(" Generating Argon2id password hash...") password_hash = self._hasher.hash(password) vault_content = { "auth_registration": { "username": username, "password_hash": password_hash, }, "oauth_clients": {}, } with tempfile.NamedTemporaryFile( mode="w", suffix=".yml", delete=False ) as temp_file: yaml.safe_dump(vault_content, temp_file, default_flow_style=False) temp_path = temp_file.name try: logger.info(" Encrypting vault with ansible-vault...") subprocess.run( [ "ansible-vault", "encrypt", temp_path, "--vault-password-file", str(self.vault_pass_file), "--encrypt-vault-id", "default", ], check=True, capture_output=True, ) shutil.move(temp_path, str(self.vault_file)) self.vault_file.chmod(0o600) logger.info(" Vault encrypted and saved successfully") finally: if os.path.exists(temp_path): os.unlink(temp_path) logger.info("Vault setup complete") # Generate JWT keys for token signing self._generate_jwt_keys() def _generate_jwt_keys(self) -> None: """Generate RSA key pair for JWT signing in e2e tests.""" logger.info("Generating JWT keys for e2e tests...") logger.info(" Keys directory: %s", self.keys_dir) self.keys_dir.mkdir(parents=True, exist_ok=True) # Generate RSA private key (2048-bit for faster tests) subprocess.run( [ "openssl", "genrsa", "-out", str(self.private_key_file), "2048", ], check=True, capture_output=True, ) self.private_key_file.chmod(0o600) logger.info(" Generated private key: %s", self.private_key_file) # Extract public key subprocess.run( [ "openssl", "rsa", "-in", str(self.private_key_file), "-pubout", "-out", str(self.public_key_file), ], check=True, capture_output=True, ) self.public_key_file.chmod(0o644) logger.info(" Generated public key: %s", self.public_key_file) logger.info("JWT keys generated successfully") def cleanup(self) -> None: """Clean up vault files.""" logger.info("Cleaning up vault files at: %s", self.base_dir) if self.base_dir.exists(): shutil.rmtree(self.base_dir) logger.info("Vault cleanup complete") class ServerManager: """Manages FastAPI server lifecycle for integration tests.""" REQUIRED_PACKAGES = [ "fastapi", "uvicorn", 
"pydantic", "PyJWT", "argon2-cffi", "pyyaml", "httpx", "python-multipart", "jsonschema", "ansible", "cryptography", "dependency-injector", ] def __init__( # noqa: R0913,R0917 pylint: disable=too-many-arguments,too-many-positional-arguments self, host: str, port: int, vault_manager: VaultManager, # noqa: W0621 project_dir: str, # noqa: W0621 venv_dir: str, # noqa: W0621 ): """Initialize server manager. Args: host: Server host. port: Server port. vault_manager: Vault manager instance. project_dir: Path to build_stream project directory. venv_dir: Path to virtual environment directory. """ self.host = host self.port = port self.vault_manager = vault_manager self.project_dir = project_dir self.venv_dir = Path(venv_dir) self.process: Optional[subprocess.Popen] = None def _setup_venv(self) -> None: """Create virtual environment and install dependencies.""" logger.info("Setting up Python virtual environment...") logger.info(" Venv directory: %s", self.venv_dir) if not self.venv_dir.exists(): logger.info(" Creating virtual environment...") subprocess.run( ["python3", "-m", "venv", str(self.venv_dir)], check=True, capture_output=True, ) logger.info(" Virtual environment created") else: logger.info(" Virtual environment already exists") pip_path = self.venv_dir / "bin" / "pip" logger.info(" Upgrading pip...") subprocess.run( [str(pip_path), "install", "--upgrade", "pip", "-q"], check=True, capture_output=True, ) logger.info(" Installing dependencies: %s", ", ".join(self.REQUIRED_PACKAGES)) subprocess.run( [str(pip_path), "install", "-q"] + self.REQUIRED_PACKAGES, check=True, capture_output=True, ) logger.info(" Dependencies installed successfully") @property def python_path(self) -> str: """Get path to Python executable in virtual environment.""" return str(self.venv_dir / "bin" / "python") def _is_port_in_use(self) -> bool: """Check if the port is already in use.""" with socket.socket(socket.AF_INET, socket.SOCK_STREAM) as s: return s.connect_ex((self.host, self.port)) == 0 def _free_port(self) -> None: """Free the port if it's in use.""" if self._is_port_in_use(): try: result = subprocess.run( ["lsof", "-t", f"-i:{self.port}"], capture_output=True, text=True, check=False, ) if result.stdout.strip(): for pid in result.stdout.strip().split("\n"): try: os.kill(int(pid), signal.SIGKILL) except (ProcessLookupError, ValueError): pass time.sleep(1) except FileNotFoundError: pass def start(self) -> None: """Start the FastAPI server.""" logger.info("Starting FastAPI server...") self._setup_venv() logger.info(" Freeing port %d if in use...", self.port) self._free_port() logger.info(" Configuring server environment variables...") env = os.environ.copy() env.update({ "HOST": self.host, "PORT": str(self.port), "ANSIBLE_VAULT_PASSWORD_FILE": str(self.vault_manager.vault_pass_file), "OAUTH_CLIENTS_VAULT_PATH": str(self.vault_manager.vault_file), "AUTH_CONFIG_VAULT_PATH": str(self.vault_manager.vault_file), "JWT_PRIVATE_KEY_PATH": str(self.vault_manager.private_key_file), "JWT_PUBLIC_KEY_PATH": str(self.vault_manager.public_key_file), "LOG_LEVEL": "DEBUG", "PYTHONPATH": str(self.project_dir), }) logger.info(" HOST=%s", self.host) logger.info(" PORT=%s", self.port) logger.info(" ANSIBLE_VAULT_PASSWORD_FILE=%s", self.vault_manager.vault_pass_file) logger.info(" OAUTH_CLIENTS_VAULT_PATH=%s", self.vault_manager.vault_file) logger.info(" AUTH_CONFIG_VAULT_PATH=%s", self.vault_manager.vault_file) logger.info(" JWT_PRIVATE_KEY_PATH=%s", self.vault_manager.private_key_file) logger.info(" JWT_PUBLIC_KEY_PATH=%s", 
self.vault_manager.public_key_file) logger.info(" LOG_LEVEL=DEBUG") logger.info(" PYTHONPATH=%s", self.project_dir) logger.info(" Starting uvicorn server...") logger.info(" Python: %s", self.python_path) logger.info(" Working directory: %s", self.project_dir) # Process needs to be managed separately for start/stop lifecycle # Cannot use 'with' statement as process must persist after method returns self.process = subprocess.Popen( # noqa: R1732 [ self.python_path, "-m", "uvicorn", "main:app", "--host", self.host, "--port", str(self.port), ], cwd=self.project_dir, env=env, stdout=subprocess.PIPE, stderr=subprocess.PIPE, ) logger.info(" Server process started with PID: %d", self.process.pid) self._wait_for_server() def _wait_for_server(self) -> None: """Wait for server to be ready.""" logger.info(" Waiting for server to be ready (timeout: %ds)...", IntegrationTestConfig.SERVER_STARTUP_TIMEOUT) start_time = time.time() while time.time() - start_time < IntegrationTestConfig.SERVER_STARTUP_TIMEOUT: try: response = httpx.get( f"http://{self.host}:{self.port}/health", timeout=1.0, ) if response.status_code == 200: elapsed = time.time() - start_time logger.info(" Server is ready! (took %.1fs)", elapsed) logger.info(" Server URL: http://%s:%d", self.host, self.port) return except httpx.RequestError: pass time.sleep(0.5) # Log server output before stopping if self.process: logger.error("Server failed to start. Checking process output...") if self.process.stdout: stdout_output = self.process.stdout.read().decode() logger.error("Server STDOUT:\n%s", stdout_output) if self.process.stderr: stderr_output = self.process.stderr.read().decode() logger.error("Server STDERR:\n%s", stderr_output) # Check process return code self.process.poll() if self.process.returncode is not None: logger.error("Server process exited with code: %s", self.process.returncode) self.stop() raise RuntimeError( f"Server failed to start within {IntegrationTestConfig.SERVER_STARTUP_TIMEOUT}s" ) def stop(self) -> None: """Stop the FastAPI server.""" logger.info("Stopping FastAPI server...") if self.process: logger.info(" Terminating server process (PID: %d)...", self.process.pid) self.process.terminate() try: self.process.wait(timeout=5) logger.info(" Server stopped gracefully") except subprocess.TimeoutExpired: logger.info(" Server did not stop gracefully, killing...") self.process.kill() self.process.wait() logger.info(" Server killed") self.process = None self._free_port() logger.info("Server shutdown complete") @property def base_url(self) -> str: """Get the server base URL.""" return f"http://{self.host}:{self.port}" @pytest.fixture(scope="module") def integration_test_dir() -> Generator[str, None, None]: """Create a temporary directory for integration test files. Yields: Path to temporary directory. """ temp_dir = tempfile.mkdtemp(prefix="build_stream_integration_") yield temp_dir shutil.rmtree(temp_dir, ignore_errors=True) @pytest.fixture(scope="module") def vault_manager( integration_test_dir: str, auth_password: str, ) -> Generator[VaultManager, None, None]: # noqa: W0621 """Create and configure vault manager. Args: integration_test_dir: Temporary directory for test files. auth_password: The auth password to use for vault setup. Yields: Configured VaultManager instance. 
""" manager = VaultManager(integration_test_dir) manager.setup( username=IntegrationTestConfig.AUTH_USERNAME, password=auth_password, ) yield manager manager.cleanup() @pytest.fixture(scope="module") def project_dir() -> str: """Get the build_stream project directory. Returns: Path to build_stream project directory. """ return str(Path(__file__).parent.parent.parent.parent) @pytest.fixture(scope="module") def venv_dir(integration_test_dir: str) -> str: # noqa: W0621 """Get path to virtual environment directory. Args: integration_test_dir: Temporary directory for test files. Returns: Path to virtual environment directory. """ return os.path.join(integration_test_dir, "venv") @pytest.fixture(scope="module") def server_manager( vault_manager: VaultManager, # noqa: W0621 project_dir: str, # noqa: W0621 venv_dir: str, # noqa: W0621 ) -> Generator[ServerManager, None, None]: """Create and manage the FastAPI server. Args: vault_manager: Vault manager fixture. project_dir: Project directory fixture. venv_dir: Virtual environment directory fixture. Yields: Running ServerManager instance. """ manager = ServerManager( host=IntegrationTestConfig.SERVER_HOST, port=IntegrationTestConfig.SERVER_PORT, vault_manager=vault_manager, project_dir=project_dir, venv_dir=venv_dir, ) manager.start() yield manager manager.stop() @pytest.fixture(scope="module") def base_url(server_manager: ServerManager) -> str: # noqa: W0621 """Get the server base URL. Args: server_manager: Server manager fixture. Returns: Server base URL. """ return server_manager.base_url @pytest.fixture(scope="module") def auth_password() -> str: """Generate a single auth password for the entire test module. Returns: Auth password to be used consistently across tests. """ return IntegrationTestConfig.get_auth_password() @pytest.fixture def valid_auth_header(auth_password: str) -> Dict[str, str]: # noqa: W0621 """Create valid Basic Auth header. Args: auth_password: The auth password to use. Returns: Dictionary with Authorization header. """ credentials = base64.b64encode( f"{IntegrationTestConfig.AUTH_USERNAME}:{auth_password}".encode() ).decode() return {"Authorization": f"Basic {credentials}"} @pytest.fixture def invalid_auth_header() -> Dict[str, str]: """Create invalid Basic Auth header. Returns: Dictionary with invalid Authorization header. """ credentials = base64.b64encode(b"wrong_user:wrong_password").decode() return {"Authorization": f"Basic {credentials}"} @pytest.fixture def reset_vault( vault_manager: VaultManager, auth_password: str, ) -> Generator[None, None, None]: # noqa: W0621 """Reset vault to initial state before and after test. Args: vault_manager: Vault manager fixture. auth_password: The auth password to use for vault setup. Yields: None """ vault_manager.setup( username=IntegrationTestConfig.AUTH_USERNAME, password=auth_password, ) yield vault_manager.setup( username=IntegrationTestConfig.AUTH_USERNAME, password=auth_password, ) ================================================ FILE: build_stream/tests/end_to_end/api/test_api_flow_e2e.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. 
# You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """End-to-end integration tests for complete API workflow. These tests validate the complete OAuth2 authentication workflow from client registration through token generation and validation. This test suite focuses on authentication and authorization mechanisms, providing comprehensive coverage of the auth API. Usage: pytest tests/integration/test_api_flow_e2e.py -v -m e2e Requirements: - ansible-vault must be installed - Tests require write access to create temporary vault files - RSA keys must be available for JWT signing Test Flow: 1. Health check - Verify server is running 2. Client Registration - Register a new OAuth client with proper scopes 3. Token Generation - Obtain access token using client credentials 4. Token Validation - Verify JWT structure, uniqueness, and scope enforcement 5. Error Handling - Test various failure scenarios and security validations 6. Security Validation - Verify proper security measures are enforced Test Classes: - TestCompleteAPIFlow: Main workflow tests (happy path scenarios) - TestAPIFlowErrorHandling: Error scenario testing - TestAPIFlowSecurityValidation: Security measure validation Key Features Tested: - OAuth2 client registration with Basic Auth - JWT token generation with client_credentials grant - Scope-based authorization (catalog:read, catalog:write) - Token uniqueness and validation - Error handling and security measures - Client credential format validation - Maximum client limits enforcement Note: This test suite focuses specifically on authentication and authorization. Protected API endpoints (like parse_catalog) are tested separately when implemented. """ # pylint: disable=redefined-outer-name from typing import Dict, Optional import httpx import pytest # Import helper functions from conftest from tests.end_to_end.api.conftest import ( generate_test_client_secret, generate_invalid_client_id, generate_invalid_client_secret, ) class APIFlowContext: # noqa: R0902 pylint: disable=too-many-instance-attributes """Context object to store state across API flow tests. This class maintains state between test steps, allowing tests to share data like client credentials and access tokens. Attributes: client_id: Registered client identifier. client_secret: Registered client secret. access_token: Generated JWT access token. token_type: Token type (Bearer). expires_in: Token expiration time in seconds. scope: Granted scopes. """ def __init__(self): """Initialize empty context.""" self.client_id: Optional[str] = None self.client_secret: Optional[str] = None self.client_name: Optional[str] = None self.allowed_scopes: Optional[list] = None self.access_token: Optional[str] = None self.token_type: Optional[str] = None self.expires_in: Optional[int] = None self.scope: Optional[str] = None def has_client_credentials(self) -> bool: """Check if client credentials are available.""" return self.client_id is not None and self.client_secret is not None def has_access_token(self) -> bool: """Check if access token is available.""" return self.access_token is not None def get_auth_header(self) -> Dict[str, str]: """Get Authorization header with Bearer token. 
Returns: Dictionary with Authorization header. Raises: ValueError: If access token is not available. """ if not self.has_access_token(): raise ValueError("Access token not available") return {"Authorization": f"Bearer {self.access_token}"} @pytest.fixture(scope="class") def api_flow_context(): """Create a shared context for API flow tests. Returns: APIFlowContext instance shared across test class. """ return APIFlowContext() @pytest.mark.e2e @pytest.mark.integration class TestCompleteAPIFlow: """End-to-end test suite for complete OAuth2 authentication workflow. Tests are ordered to follow the natural authentication flow: 1. Health check - Verify server is running 2. Client registration - Register OAuth client with scopes 3. Token generation - Obtain JWT access token 4. Token validation - Verify token structure and scopes 5. Scope enforcement - Test subset and unauthorized scope requests 6. Security validation - Test invalid credentials and token uniqueness Each test builds on the previous, storing state in the shared context. This covers the complete authentication and authorization workflow. Note: Protected API endpoints are not tested here - they are implemented separately when the actual endpoints are available. """ def test_01_health_check( self, base_url: str, reset_vault, # noqa: W0613 pylint: disable=unused-argument ): """Step 1: Verify server health endpoint is accessible. This confirms the server is running and ready to accept requests. """ with httpx.Client(base_url=base_url, timeout=30.0) as client: response = client.get("/health") assert response.status_code == 200, f"Health check failed: {response.text}" data = response.json() assert data["status"] == "healthy" def test_02_register_client( self, base_url: str, valid_auth_header: Dict[str, str], api_flow_context: APIFlowContext, # noqa: W0621 ): """Step 2: Register a new OAuth client. This creates a client that will be used for subsequent token requests. Client credentials are stored in the shared context. """ with httpx.Client(base_url=base_url, timeout=30.0) as client: response = client.post( "/api/v1/auth/register", headers=valid_auth_header, json={ "client_name": "api-flow-test-client", "description": "Client for complete API flow testing", "allowed_scopes": ["catalog:read", "catalog:write"], }, ) assert response.status_code == 201, f"Registration failed: {response.text}" data = response.json() # Verify response structure assert "client_id" in data assert "client_secret" in data assert data["client_id"].startswith("bld_") assert data["client_secret"].startswith("bld_s_") # Store credentials in context for subsequent tests api_flow_context.client_id = data["client_id"] api_flow_context.client_secret = data["client_secret"] api_flow_context.client_name = data["client_name"] api_flow_context.allowed_scopes = data["allowed_scopes"] def test_03_request_token( self, base_url: str, api_flow_context: APIFlowContext, # noqa: W0621 ): """Step 3: Request access token using client credentials. Uses the client credentials from registration to obtain a JWT token. Token is stored in the shared context for subsequent API calls. """ assert api_flow_context.has_client_credentials(), ( "Client credentials not available. Run test_02_register_client first." 
) with httpx.Client(base_url=base_url, timeout=30.0) as client: response = client.post( "/api/v1/auth/token", data={ "grant_type": "client_credentials", "client_id": api_flow_context.client_id, "client_secret": api_flow_context.client_secret, }, ) assert response.status_code == 200, f"Token request failed: {response.text}" data = response.json() # Verify response structure assert "access_token" in data assert data["token_type"] == "Bearer" assert data["expires_in"] > 0 assert "scope" in data # Verify JWT structure parts = data["access_token"].split(".") assert len(parts) == 3, "Token should be valid JWT format" # Store token in context for subsequent tests api_flow_context.access_token = data["access_token"] api_flow_context.token_type = data["token_type"] api_flow_context.expires_in = data["expires_in"] api_flow_context.scope = data["scope"] def test_04_token_contains_granted_scopes( self, api_flow_context: APIFlowContext, # noqa: W0621 ): """Step 4: Verify token contains the expected scopes. Confirms that the granted scopes match the client's allowed scopes. """ assert api_flow_context.has_access_token(), ( "Access token not available. Run test_03_request_token first." ) # Verify scopes match what was registered granted_scopes = api_flow_context.scope.split() for scope in api_flow_context.allowed_scopes: assert scope in granted_scopes, f"Expected scope '{scope}' not in token" def test_05_request_token_with_subset_scope( self, base_url: str, api_flow_context: APIFlowContext, # noqa: W0621 ): """Step 5: Request token with a subset of allowed scopes. Verifies that clients can request fewer scopes than allowed. """ assert api_flow_context.has_client_credentials(), ( "Client credentials not available. Run test_02_register_client first." ) with httpx.Client(base_url=base_url, timeout=30.0) as client: response = client.post( "/api/v1/auth/token", data={ "grant_type": "client_credentials", "client_id": api_flow_context.client_id, "client_secret": api_flow_context.client_secret, "scope": "catalog:read", }, ) assert response.status_code == 200, f"Token request failed: {response.text}" data = response.json() assert data["scope"] == "catalog:read" def test_06_reject_unauthorized_scope( self, base_url: str, api_flow_context: APIFlowContext, # noqa: W0621 ): """Step 6: Verify unauthorized scope is rejected. Confirms that clients cannot request scopes beyond their allowed set. """ assert api_flow_context.has_client_credentials(), ( "Client credentials not available. Run test_02_register_client first." ) with httpx.Client(base_url=base_url, timeout=30.0) as client: response = client.post( "/api/v1/auth/token", data={ "grant_type": "client_credentials", "client_id": api_flow_context.client_id, "client_secret": api_flow_context.client_secret, "scope": "admin:full", }, ) assert response.status_code == 400, f"Expected 400, got: {response.text}" data = response.json() assert data["detail"]["error"] == "invalid_scope" def test_07_reject_invalid_credentials( self, base_url: str, api_flow_context: APIFlowContext, # noqa: W0621 ): """Step 7: Verify invalid credentials are rejected. Confirms that token requests with wrong credentials fail properly. """ assert api_flow_context.has_client_credentials(), ( "Client credentials not available. Run test_02_register_client first." 
) with httpx.Client(base_url=base_url, timeout=30.0) as client: response = client.post( "/api/v1/auth/token", data={ "grant_type": "client_credentials", "client_id": api_flow_context.client_id, "client_secret": generate_test_client_secret(), }, ) assert response.status_code == 401, f"Expected 401, got: {response.text}" data = response.json() assert data["detail"]["error"] == "invalid_client" def test_08_multiple_tokens_are_unique( self, base_url: str, api_flow_context: APIFlowContext, # noqa: W0621 ): """Step 8: Verify each token request generates a unique token. Confirms that tokens have unique identifiers (jti claim). """ assert api_flow_context.has_client_credentials(), ( "Client credentials not available. Run test_02_register_client first." ) tokens = [] with httpx.Client(base_url=base_url, timeout=30.0) as client: for _ in range(3): response = client.post( "/api/v1/auth/token", data={ "grant_type": "client_credentials", "client_id": api_flow_context.client_id, "client_secret": api_flow_context.client_secret, }, ) assert response.status_code == 200 tokens.append(response.json()["access_token"]) # All tokens should be unique assert len(set(tokens)) == 3, "All tokens should be unique" @pytest.mark.e2e @pytest.mark.integration class TestAPIFlowErrorHandling: """Test error handling across the OAuth2 authentication flow. These tests verify proper error responses for various failure scenarios: - Registration without/with invalid authentication - Token requests for unregistered clients - Invalid grant types and credentials - Format validation for client credentials Each test ensures that error responses are appropriate and secure, without exposing sensitive information. """ def test_register_without_auth_fails( self, base_url: str, reset_vault, # noqa: W0613 pylint: disable=unused-argument ): """Verify registration without authentication fails.""" with httpx.Client(base_url=base_url, timeout=30.0) as client: response = client.post( "/api/v1/auth/register", json={"client_name": "unauthorized-client"}, ) assert response.status_code == 401, f"Expected 401, got: {response.text}" def test_register_with_invalid_auth_fails( self, base_url: str, invalid_auth_header: Dict[str, str], reset_vault, # noqa: W0613 pylint: disable=unused-argument ): """Verify registration with invalid credentials fails.""" with httpx.Client(base_url=base_url, timeout=30.0) as client: response = client.post( "/api/v1/auth/register", headers=invalid_auth_header, json={"client_name": "invalid-auth-client"}, ) assert response.status_code == 401, f"Expected 401, got: {response.text}" def test_token_without_registration_fails( self, base_url: str, reset_vault, # noqa: W0613 pylint: disable=unused-argument ): """Verify token request for unregistered client fails.""" with httpx.Client(base_url=base_url, timeout=30.0) as client: response = client.post( "/api/v1/auth/token", data={ "grant_type": "client_credentials", "client_id": "bld_nonexistent_client_12345678", "client_secret": generate_test_client_secret(), }, ) assert response.status_code == 401, f"Expected 401, got: {response.text}" data = response.json() assert data["detail"]["error"] == "invalid_client" def test_token_with_invalid_grant_type_fails( self, base_url: str, valid_auth_header: Dict[str, str], reset_vault, # noqa: W0613 pylint: disable=unused-argument ): """Verify token request with unsupported grant type fails.""" # First register a client with httpx.Client(base_url=base_url, timeout=30.0) as client: reg_response = client.post( "/api/v1/auth/register", 
headers=valid_auth_header, json={"client_name": "grant-type-test-client"}, ) assert reg_response.status_code == 201 creds = reg_response.json() # Try token with invalid grant type response = client.post( "/api/v1/auth/token", data={ "grant_type": "authorization_code", "client_id": creds["client_id"], "client_secret": creds["client_secret"], }, ) assert response.status_code == 422, f"Expected 422, got: {response.text}" @pytest.mark.e2e @pytest.mark.integration class TestAPIFlowSecurityValidation: """Security validation tests for the OAuth2 authentication flow. These tests verify that security measures are properly enforced: - Client credential format validation - Maximum client limits enforcement - Proper error handling without information disclosure - Token security and uniqueness validation These tests ensure the authentication system follows security best practices and does not expose sensitive information in error responses. """ def test_client_credentials_format_validation( self, base_url: str, reset_vault, # noqa: W0613 pylint: disable=unused-argument ): """Verify client credential format validation.""" with httpx.Client(base_url=base_url, timeout=30.0) as client: # Invalid client_id format response = client.post( "/api/v1/auth/token", data={ "grant_type": "client_credentials", "client_id": generate_invalid_client_id(), "client_secret": generate_test_client_secret(), }, ) assert response.status_code == 422, f"Expected 422, got: {response.text}" def test_client_secret_format_validation( self, base_url: str, reset_vault, # noqa: W0613 pylint: disable=unused-argument ): """Verify client secret format validation.""" with httpx.Client(base_url=base_url, timeout=30.0) as client: response = client.post( "/api/v1/auth/token", data={ "grant_type": "client_credentials", "client_id": "bld_valid_format_client_id", "client_secret": generate_invalid_client_secret(), }, ) assert response.status_code == 422, f"Expected 422, got: {response.text}" def test_max_clients_limit_enforced( self, base_url: str, valid_auth_header: Dict[str, str], reset_vault, # noqa: W0613 pylint: disable=unused-argument ): """Verify maximum client limit is enforced.""" with httpx.Client(base_url=base_url, timeout=30.0) as client: # Register first client response1 = client.post( "/api/v1/auth/register", headers=valid_auth_header, json={"client_name": "first-client"}, ) assert response1.status_code == 201 # Try to register second client response2 = client.post( "/api/v1/auth/register", headers=valid_auth_header, json={"client_name": "second-client"}, ) assert response2.status_code == 409, f"Expected 409, got: {response2.text}" data = response2.json() assert data["detail"]["error"] == "max_clients_reached" ================================================ FILE: build_stream/tests/end_to_end/api/test_build_image_e2e.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. 
"""End-to-end tests for Build Image API.""" import json import subprocess import time from pathlib import Path from typing import Dict, Any import pytest import requests class TestBuildImageE2E: """End-to-end tests for build image workflow.""" BASE_URL = "http://localhost:8000" API_PREFIX = "/api/v1" AUTH_TOKEN = "test-e2e-token" REQUEST_TIMEOUT = 30 @classmethod def setup_class(cls): """Setup class with server startup.""" # Start the API server in background cls.server_process = subprocess.Popen( ["python", "main.py"], cwd="/opt/omnia/omnia/omnia_code/build_stream", stdout=subprocess.PIPE, stderr=subprocess.PIPE, ) # Wait for server to start time.sleep(5) # Verify server is running try: response = requests.get( f"{cls.BASE_URL}/health", timeout=cls.REQUEST_TIMEOUT, ) assert response.status_code == 200 except requests.exceptions.ConnectionError: pytest.skip("API server not available") @classmethod def teardown_class(cls): """Cleanup by stopping server.""" if hasattr(cls, 'server_process'): cls.server_process.terminate() cls.server_process.wait() def get_headers(self, correlation_id: str = None) -> Dict[str, str]: """Get request headers.""" headers = { "Authorization": f"Bearer {self.AUTH_TOKEN}", "Content-Type": "application/json", } if correlation_id: headers["X-Correlation-Id"] = correlation_id return headers def test_full_build_image_workflow_x86_64(self): """Test complete build image workflow for x86_64.""" correlation_id = "e2e-test-x86_64" headers = self.get_headers(correlation_id) # Step 1: Create a job create_job_response = requests.post( f"{self.BASE_URL}{self.API_PREFIX}/jobs", json={ "stage": "build-image", "input_parameters": { "architecture": "x86_64", "image_key": "e2e-test-image", "functional_groups": [ "slurm_control_node_x86_64", "slurm_node_x86_64", "login_node_x86_64" ] } }, headers=headers, timeout=self.REQUEST_TIMEOUT, ) assert create_job_response.status_code == 201 job_data = create_job_response.json() job_id = job_data["job_id"] assert job_id # Step 2: Verify job was created with build-image stage get_job_response = requests.get( f"{self.BASE_URL}{self.API_PREFIX}/jobs/{job_id}", headers=headers, timeout=self.REQUEST_TIMEOUT, ) assert get_job_response.status_code == 200 job_detail = get_job_response.json() stages = {stage["stage_name"]: stage for stage in job_detail["stages"]} assert "build-image" in stages assert stages["build-image"]["status"] == "PENDING" # Step 3: Trigger build image stage build_image_response = requests.post( f"{self.BASE_URL}{self.API_PREFIX}/jobs/{job_id}/stages/build-image", json={ "architecture": "x86_64", "image_key": "e2e-test-image", "functional_groups": [ "slurm_control_node_x86_64", "slurm_node_x86_64", "login_node_x86_64" ] }, headers=headers ) assert build_image_response.status_code == 202 build_data = build_image_response.json() assert build_data["job_id"] == job_id assert build_data["stage"] == "build-image" assert build_data["status"] == "accepted" assert build_data["architecture"] == "x86_64" assert build_data["image_key"] == "e2e-test-image" assert len(build_data["functional_groups"]) == 3 # Step 4: Verify stage is now STARTED get_job_response2 = requests.get( f"{self.BASE_URL}{self.API_PREFIX}/jobs/{job_id}", headers=headers, timeout=self.REQUEST_TIMEOUT, ) assert get_job_response2.status_code == 200 job_detail2 = get_job_response2.json() stages2 = {stage["stage_name"]: stage for stage in job_detail2["stages"]} assert stages2["build-image"]["status"] == "STARTED" # Step 5: Verify request file in queue queue_dir = 
Path("/opt/omnia/build_stream/queue/requests") request_files = list(queue_dir.glob(f"{job_id}_build-image_*.json")) assert len(request_files) == 1 # Verify request file content request_data = json.loads(request_files[0].read_text()) assert request_data["job_id"] == job_id assert request_data["architecture"] == "x86_64" assert request_data["image_key"] == "e2e-test-image" assert request_data["functional_groups"] == [ "slurm_control_node_x86_64", "slurm_node_x86_64", "login_node_x86_64" ] assert request_data["playbook_path"] == "/omnia/build_image_x86_64/build_image_x86_64.yml" assert request_data["correlation_id"] == correlation_id # Step 6: Verify playbook command generation with open(request_files[0], "r", encoding="utf-8") as f: request_content = json.load(f) # The request should contain all necessary fields for playbook execution assert "request_id" in request_content assert "timeout_minutes" in request_content assert "submitted_at" in request_content assert "inventory_file_path" not in request_content # Not needed for x86_64 # Step 7: Verify stage naming (should be build-image-x86_64) assert request_content["stage_name"] == "build-image-x86_64" def test_full_build_image_workflow_aarch64(self): """Test complete build image workflow for aarch64.""" correlation_id = "e2e-test-aarch64" headers = self.get_headers(correlation_id) # Step 1: Create a job create_job_response = requests.post( f"{self.BASE_URL}{self.API_PREFIX}/jobs", json={ "stage": "build-image", "input_parameters": { "architecture": "aarch64", "image_key": "e2e-test-image-arm", "functional_groups": [ "slurm_control_node_aarch64", "slurm_node_aarch64" ] } }, headers=headers ) assert create_job_response.status_code == 201 job_data = create_job_response.json() job_id = job_data["job_id"] # Step 2: Create build_stream_config.yml with inventory host # Use the consolidated repository path structure input_dir = Path("/opt/omnia/input/project_default") input_dir.mkdir(parents=True, exist_ok=True) # Create default.yml for project name resolution default_file = Path("/opt/omnia/input/default.yml") default_file.write_text("project_name: project_default\n", encoding="utf-8") config_file = input_dir / "build_stream_config.yml" config_file.write_text("aarch64_inventory_host: 10.3.0.170\n", encoding="utf-8") # Step 3: Trigger build image stage build_image_response = requests.post( f"{self.BASE_URL}{self.API_PREFIX}/jobs/{job_id}/stages/build-image", json={ "architecture": "aarch64", "image_key": "e2e-test-image-arm", "functional_groups": [ "slurm_control_node_aarch64", "slurm_node_aarch64" ] }, headers=headers ) assert build_image_response.status_code == 202 build_data = build_image_response.json() assert build_data["architecture"] == "aarch64" # Step 4: Verify request file and inventory file creation queue_dir = Path("/opt/omnia/build_stream/queue/requests") request_files = list(queue_dir.glob(f"{job_id}_build-image_*.json")) assert len(request_files) == 1 request_data = json.loads(request_files[0].read_text(encoding="utf-8")) assert request_data["playbook_path"] == "build_image_aarch64.yml" # Only filename, not full path # Step 5: Verify inventory file was created by consolidated repository inventory_dir = Path("/opt/omnia/build_stream_inv") inventory_file = inventory_dir / job_id / "inv" assert inventory_file.exists(), "Inventory file should be created" # Verify inventory file content with open(inventory_file, 'r') as f: inventory_content = f.read() assert "10.3.0.170" in inventory_content, f"Inventory file should contain host IP: 
{inventory_content}" assert "[build_hosts]" in inventory_content, f"Inventory file should have proper format: {inventory_content}" # Step 6: Verify stage naming (should be build-image-aarch64) with open(request_files[0], "r", encoding="utf-8") as f: request_content = json.load(f) assert request_content["stage_name"] == "build-image-aarch64" # Step 7: Verify inventory_file_path is included in request assert "inventory_file_path" in request_content assert request_content["inventory_file_path"] == str(inventory_file) def test_consolidated_repository_functionality(self): """Test consolidated NfsInputRepository functionality.""" correlation_id = "e2e-test-consolidated-repo" headers = self.get_headers(correlation_id) # Step 1: Create a job create_job_response = requests.post( f"{self.BASE_URL}{self.API_PREFIX}/jobs", json={ "stage": "build-image", "input_parameters": { "architecture": "aarch64", "image_key": "e2e-consolidated-test", "functional_groups": ["slurm_control_node_aarch64"] } }, headers=headers ) assert create_job_response.status_code == 201 job_data = create_job_response.json() job_id = job_data["job_id"] # Step 2: Setup consolidated repository paths input_dir = Path("/opt/omnia/input") input_dir.mkdir(parents=True, exist_ok=True) # Create default.yml for project name resolution default_file = input_dir / "default.yml" default_file.write_text("project_name: project_default\n", encoding="utf-8") # Create config with correct key name config_file = input_dir / "project_default" / "build_stream_config.yml" config_file.parent.mkdir(parents=True, exist_ok=True) config_file.write_text("aarch64_inventory_host: 192.168.1.200\n", encoding="utf-8") # Step 3: Trigger build image stage build_image_response = requests.post( f"{self.BASE_URL}{self.API_PREFIX}/jobs/{job_id}/stages/build-image", json={ "architecture": "aarch64", "image_key": "e2e-consolidated-test", "functional_groups": ["slurm_control_node_aarch64"] }, headers=headers ) assert build_image_response.status_code == 202 # Step 4: Verify consolidated repository functionality # 4a: Verify config reading works queue_dir = Path("/opt/omnia/build_stream/queue/requests") request_files = list(queue_dir.glob(f"{job_id}_build-image_*.json")) assert len(request_files) == 1 # 4b: Verify inventory file creation inventory_dir = Path("/opt/omnia/build_stream_inv") inventory_file = inventory_dir / job_id / "inv" assert inventory_file.exists(), "Consolidated repository should create inventory file" # 4c: Verify inventory file content with open(inventory_file, 'r') as f: content = f.read() assert "192.168.1.200" in content assert "[build_hosts]" in content # 4d: Verify input directory paths work build_stream_dir = Path("/opt/omnia/build_stream") source_path = build_stream_dir / job_id / "input" dest_path = input_dir / "project_default" # These paths should be accessible through the consolidated repository assert dest_path.exists(), "Destination input directory should exist" # 4e: Verify request contains correct playbook filename (not full path) with open(request_files[0], "r", encoding="utf-8") as f: request_content = json.load(f) assert request_content["playbook_path"] == "build_image_aarch64.yml" assert request_content["stage_name"] == "build-image-aarch64" assert "inventory_file_path" in request_content def test_build_image_error_cases(self): """Test various error scenarios.""" correlation_id = "e2e-test-errors" headers = self.get_headers(correlation_id) # Test 1: Invalid architecture create_job_response = requests.post( 
f"{self.BASE_URL}{self.API_PREFIX}/jobs", json={ "stage": "build-image", "input_parameters": { "architecture": "x86_64", "image_key": "test-image", "functional_groups": ["group1"] } }, headers=headers ) job_id = create_job_response.json()["job_id"] error_response = requests.post( f"{self.BASE_URL}{self.API_PREFIX}/jobs/{job_id}/stages/build-image", json={ "architecture": "invalid_arch", "image_key": "test-image", "functional_groups": ["group1"] }, headers=headers ) assert error_response.status_code == 400 assert error_response.json()["error"] == "INVALID_ARCHITECTURE" # Test 2: Missing inventory host for aarch64 create_job_response2 = requests.post( f"{self.BASE_URL}{self.API_PREFIX}/jobs", json={ "stage": "build-image", "input_parameters": { "architecture": "aarch64", "image_key": "test-image", "functional_groups": ["group1"] } }, headers=headers ) job_id2 = create_job_response2.json()["job_id"] # Don't create config file (no inventory host) error_response2 = requests.post( f"{self.BASE_URL}{self.API_PREFIX}/jobs/{job_id2}/stages/build-image", json={ "architecture": "aarch64", "image_key": "test-image", "functional_groups": ["group1"] }, headers=headers ) assert error_response2.status_code == 400 assert error_response2.json()["error"] == "INVENTORY_HOST_MISSING" def test_build_image_concurrent_requests(self): """Test handling concurrent build image requests.""" correlation_id = "e2e-test-concurrent" headers = self.get_headers(correlation_id) # Create multiple jobs job_ids = [] for i in range(3): response = requests.post( f"{self.BASE_URL}{self.API_PREFIX}/jobs", json={ "stage": "build-image", "input_parameters": { "architecture": "x86_64", "image_key": f"concurrent-image-{i}", "functional_groups": [f"group{i}"] } }, headers=headers, timeout=self.REQUEST_TIMEOUT, ) job_ids.append(response.json()["job_id"]) # Submit build image requests concurrently import concurrent.futures def submit_build_image(job_id): return requests.post( f"{self.BASE_URL}{self.API_PREFIX}/jobs/{job_id}/stages/build-image", json={ "architecture": "x86_64", "image_key": f"concurrent-image-{job_id}", "functional_groups": [f"group{job_id}"] }, headers=headers ) with concurrent.futures.ThreadPoolExecutor(max_workers=3) as executor: futures = [executor.submit(submit_build_image, job_id) for job_id in job_ids] responses = [future.result() for future in futures] # All requests should succeed for response in responses: assert response.status_code == 202 # Verify all requests are in queue queue_dir = Path("/opt/omnia/build_stream/queue/requests") request_files = list(queue_dir.glob("*_build-image_*.json")) assert len(request_files) >= 3 # At least our 3 requests def test_build_image_audit_trail(self): """Test that build image operations create audit events.""" correlation_id = "e2e-test-audit" headers = self.get_headers(correlation_id) # Create job and trigger build image create_job_response = requests.post( f"{self.BASE_URL}{self.API_PREFIX}/jobs", json={ "stage": "build-image", "input_parameters": { "architecture": "x86_64", "image_key": "audit-test-image", "functional_groups": ["group1"] } }, headers=headers ) job_id = create_job_response.json()["job_id"] build_image_response = requests.post( f"{self.BASE_URL}{self.API_PREFIX}/jobs/{job_id}/stages/build-image", json={ "architecture": "x86_64", "image_key": "audit-test-image", "functional_groups": ["group1"] }, headers=headers ) assert build_image_response.status_code == 202 # Check audit events audit_response = requests.get( 
f"{self.BASE_URL}{self.API_PREFIX}/jobs/{job_id}/audit", headers=headers, timeout=self.REQUEST_TIMEOUT, ) assert audit_response.status_code == 200 audit_events = audit_response.json() # Should have STAGE_STARTED event for build-image build_image_events = [ event for event in audit_events if event["event_type"] == "STAGE_STARTED" and event["details"]["stage_name"] == "build-image" ] assert len(build_image_events) == 1 assert build_image_events[0]["details"]["architecture"] == "x86_64" assert build_image_events[0]["details"]["image_key"] == "audit-test-image" ================================================ FILE: build_stream/tests/end_to_end/api/test_generate_input_files_e2e.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """End-to-end tests for Generate Input Files complete workflow. These tests validate the complete generate input files workflow using real OAuth2 authentication instead of mocks. The tests follow the chronological order: 1. Health check 2. Client registration 3. Token generation 4. Job creation 5. Parse catalog execution (prerequisite) 6. Generate input files execution 7. Error handling and edge cases Requirements: - ansible-vault must be installed - Tests require write access to create temporary vault files - RSA keys must be available for JWT signing """ import json import os import uuid from typing import Dict, Any, Optional import pytest import httpx from core.jobs.value_objects import CorrelationId class GenerateInputFilesContext: """Context object to store state across generate input files tests. This class maintains state between test steps, allowing tests to share data like client credentials, access tokens, and job IDs. Attributes: client_id: Registered client identifier. client_secret: Registered client secret. access_token: Generated JWT access token. job_id: Created job ID for generate input files testing. catalog_content: Valid catalog content for testing. """ def __init__(self): """Initialize empty context.""" self.client_id: Optional[str] = None self.client_secret: Optional[str] = None self.client_name: Optional[str] = None self.allowed_scopes: Optional[list] = None self.access_token: Optional[str] = None self.token_type: Optional[str] = None self.expires_in: Optional[int] = None self.scope: Optional[str] = None self.job_id: Optional[str] = None self.catalog_content: Optional[bytes] = None def has_client_credentials(self) -> bool: """Check if client credentials are available.""" return self.client_id is not None and self.client_secret is not None def has_access_token(self) -> bool: """Check if access token is available.""" return self.access_token is not None def has_job_id(self) -> bool: """Check if job ID is available.""" return self.job_id is not None def get_auth_header(self) -> Dict[str, str]: """Get Authorization header with Bearer token. Returns: Dictionary with Authorization header. Raises: ValueError: If access token is not available. 
""" if not self.has_access_token(): raise ValueError("Access token not available") return {"Authorization": f"Bearer {self.access_token}"} def set_job_id(self, job_id: str) -> None: """Set the job ID for testing.""" self.job_id = job_id def load_catalog_content(self) -> str: """Load catalog content for testing. Returns: JSON string of catalog content. """ # Use the proper catalog_rhel fixture instead of a minimal catalog catalog_path = os.path.join( os.path.dirname(__file__), "..", "..", "fixtures", "catalogs", "catalog_rhel.json" ) with open(catalog_path, "r", encoding="utf-8") as f: content = f.read() # Store the content as bytes for upload self.catalog_content = content.encode('utf-8') return content def get_catalog_bytes(self) -> bytes: """Get catalog content as bytes.""" return self.catalog_content @pytest.fixture(scope="class") def generate_input_files_context(): """Create a shared context for generate input files tests. Returns: GenerateInputFilesContext instance for sharing state across tests. """ return GenerateInputFilesContext() class TestGenerateInputFilesE2E: """End-to-end tests for Generate Input Files complete workflow. Tests are ordered to follow the natural workflow: 1. Health check - Verify server is running 2. Client registration - Register OAuth client with catalog scopes 3. Token generation - Obtain JWT access token 4. Job creation - Create a job for generate input files 5. Parse catalog execution - Execute parse catalog stage (prerequisite) 6. Generate input files execution - Execute generate input files stage 7. Error handling - Test various failure scenarios Tests use pytest.mark.e2e and depend on fixtures from conftest.py. """ @pytest.mark.e2e def test_01_health_check(self, base_url: str): """Step 1: Verify server health. Confirms the API server is running and accessible before proceeding with authentication and workflow tests. """ with httpx.Client(base_url=base_url, timeout=30.0) as client: response = client.get("/health") assert response.status_code == 200, f"Health check failed: {response.text}" data = response.json() assert data["status"] == "healthy" @pytest.mark.e2e def test_02_register_client_for_generate_input_files( self, base_url: str, valid_auth_header: Dict[str, str], generate_input_files_context: GenerateInputFilesContext, # noqa: W0621 ): """Step 2: Register a new OAuth client for generate input files access. This creates a client that will be used for subsequent generate input files requests. Client credentials are stored in the shared context. 
""" with httpx.Client(base_url=base_url, timeout=30.0) as client: response = client.post( "/api/v1/auth/register", headers=valid_auth_header, json={ "client_name": "generate-input-files-test-client", "description": "Client for generate input files testing", "allowed_scopes": ["catalog:read", "catalog:write"], }, ) assert response.status_code == 201, f"Registration failed: {response.text}" data = response.json() # Verify response structure assert "client_id" in data assert "client_secret" in data assert data["client_id"].startswith("bld_") assert data["client_secret"].startswith("bld_s_") # Store credentials in context for subsequent tests generate_input_files_context.client_id = data["client_id"] generate_input_files_context.client_secret = data["client_secret"] generate_input_files_context.client_name = data["client_name"] generate_input_files_context.allowed_scopes = data["allowed_scopes"] @pytest.mark.e2e def test_03_request_token_for_generate_input_files( self, base_url: str, generate_input_files_context: GenerateInputFilesContext, # noqa: W0621 ): """Step 3: Request access token for generate input files API. Uses the client credentials from registration to obtain a JWT token. Token is stored in the shared context for subsequent API calls. """ assert generate_input_files_context.has_client_credentials(), ( "Client credentials not available. Run test_02_register_client_for_generate_input_files first." ) with httpx.Client(base_url=base_url, timeout=30.0) as client: response = client.post( "/api/v1/auth/token", data={ "grant_type": "client_credentials", "client_id": generate_input_files_context.client_id, "client_secret": generate_input_files_context.client_secret, }, ) assert response.status_code == 200, f"Token request failed: {response.text}" data = response.json() # Verify response structure assert "access_token" in data assert data["token_type"] == "Bearer" assert data["expires_in"] > 0 assert "scope" in data # Verify JWT structure parts = data["access_token"].split(".") assert len(parts) == 3, "Token should be valid JWT format" # Store token in context for subsequent tests generate_input_files_context.access_token = data["access_token"] generate_input_files_context.token_type = data["token_type"] generate_input_files_context.expires_in = data["expires_in"] generate_input_files_context.scope = data["scope"] @pytest.mark.e2e def test_04_create_job_for_generate_input_files( self, base_url: str, generate_input_files_context: GenerateInputFilesContext, # noqa: W0621 ): """Step 4: Create a new job for generate input files testing. Tests job creation with proper validation and idempotency. """ assert generate_input_files_context.has_access_token(), ( "Access token not available. Run test_03_request_token_for_generate_input_files first." 
) # Prepare job creation request job_data = { "client_id": generate_input_files_context.client_id, "client_name": "Generate Input Files Test Client" } idempotency_key = str(uuid.uuid4()) headers = generate_input_files_context.get_auth_header() headers["Idempotency-Key"] = idempotency_key with httpx.Client(base_url=base_url, timeout=30.0) as client: response = client.post( "/api/v1/jobs", json=job_data, headers=headers, ) assert response.status_code == 201, f"Job creation failed: {response.text}" data = response.json() # Verify response structure assert "job_id" in data assert "job_state" in data assert "created_at" in data assert "correlation_id" in data # Verify job ID format (UUID) uuid.UUID(data["job_id"]) # This will raise ValueError if not valid UUID # Store job ID in context generate_input_files_context.set_job_id(data["job_id"]) # Verify job state assert data["job_state"] == "CREATED" @pytest.mark.e2e def test_05_parse_catalog_prerequisite( self, base_url: str, generate_input_files_context: GenerateInputFilesContext, # noqa: W0621 ): """Step 5: Execute parse catalog as prerequisite for generate input files. Parse catalog must be executed successfully before generate input files can be run, as it depends on the catalog artifacts. """ assert generate_input_files_context.has_access_token(), ( "Access token not available. Run test_03_request_token_for_generate_input_files first." ) assert generate_input_files_context.has_job_id(), ( "Job ID not available. Run test_04_create_job_for_generate_input_files first." ) # Load catalog content generate_input_files_context.load_catalog_content() assert generate_input_files_context.catalog_content is not None headers = generate_input_files_context.get_auth_header() with httpx.Client(base_url=base_url, timeout=30.0) as client: response = client.post( f"/api/v1/jobs/{generate_input_files_context.job_id}/stages/parse-catalog", files={ "file": ( "catalog.json", generate_input_files_context.catalog_content, "application/json" ) }, headers=headers, ) # The response should indicate the stage was processed successfully assert response.status_code == 200, ( f"Parse catalog failed: {response.text}" ) # Get response data for verification response_data = response.json() # Verify the response structure assert "status" in response_data assert response_data["status"] == "success" assert "message" in response_data @pytest.mark.e2e def test_06_generate_input_files_success( self, base_url: str, generate_input_files_context: GenerateInputFilesContext, # noqa: W0621 ): """Step 6: Execute generate input files successfully. Tests the complete generate input files workflow with default policy. This depends on parse catalog having been executed first. """ assert generate_input_files_context.has_access_token(), ( "Access token not available. Run test_03_request_token_for_generate_input_files first." ) assert generate_input_files_context.has_job_id(), ( "Job ID not available. Run test_04_create_job_for_generate_input_files first." 
) headers = generate_input_files_context.get_auth_header() # Execute generate input files with default policy with httpx.Client(base_url=base_url, timeout=30.0) as client: response = client.post( f"/api/v1/jobs/{generate_input_files_context.job_id}/stages/generate-input-files", headers=headers, ) # Should process the request successfully # Tests should fail on any error (including 500) assert response.status_code == 200, ( f"Generate input files failed with status {response.status_code}: {response.text}" ) # Verify minimal response structure response_data = response.json() assert "stage_state" in response_data assert response_data["stage_state"] in ["COMPLETED", "FAILED"] if response_data["stage_state"] == "COMPLETED": # Should have only these three fields assert "job_id" in response_data assert "message" in response_data assert "stage_state" in response_data print(f"✅ Generate input files completed successfully!") print(f"Response: {response_data}") else: print(f"⚠️ Generate input files completed with stage state: {response_data['stage_state']}") @pytest.mark.e2e def test_07_generate_input_files_with_custom_policy( self, base_url: str, generate_input_files_context: GenerateInputFilesContext, # noqa: W0621 ): """Step 7: Test generate input files with custom adapter policy. Tests error handling and various policy path scenarios. """ assert generate_input_files_context.has_access_token(), ( "Access token not available. Run test_03_request_token_for_generate_input_files first." ) assert generate_input_files_context.has_job_id(), ( "Job ID not available. Run test_04_create_job_for_generate_input_files first." ) headers = generate_input_files_context.get_auth_header() # Test with invalid policy path invalid_request = { "adapter_policy_path": "../../../etc/passwd" } with httpx.Client(base_url=base_url, timeout=30.0) as client: error_response = client.post( f"/api/v1/jobs/{generate_input_files_context.job_id}/stages/generate-input-files", json=invalid_request, headers=headers, ) # Should reject invalid path assert error_response.status_code in [400, 422], ( f"Expected rejection of invalid policy path: {error_response.text}" ) # Create a fresh job to avoid STAGE_ALREADY_COMPLETED job_data = { "client_id": generate_input_files_context.client_id, "client_name": "Generate Input Files Test Client (recovery)" } new_idempotency_key = str(uuid.uuid4()) new_headers = headers.copy() new_headers["Idempotency-Key"] = new_idempotency_key with httpx.Client(base_url=base_url, timeout=30.0) as client: job_response = client.post( "/api/v1/jobs", json=job_data, headers=new_headers, ) assert job_response.status_code == 201, f"Job creation failed: {job_response.text}" new_job_id = job_response.json()["job_id"] # Parse catalog for the new job (prerequisite) generate_input_files_context.load_catalog_content() with httpx.Client(base_url=base_url, timeout=30.0) as client: parse_response = client.post( f"/api/v1/jobs/{new_job_id}/stages/parse-catalog", files={ "file": ( "catalog.json", generate_input_files_context.catalog_content, "application/json", ) }, headers=headers, ) assert parse_response.status_code == 200, ( f"Parse catalog failed for recovery job: {parse_response.text}" ) # Test with valid request (default policy) on the fresh job with httpx.Client(base_url=base_url, timeout=3000.0) as client: recovery_response = client.post( f"/api/v1/jobs/{new_job_id}/stages/generate-input-files", headers=headers, ) # Should process the valid request assert recovery_response.status_code in [200, 400, 422, 500], ( f"Valid 
request failed: {recovery_response.text}" ) ================================================ FILE: build_stream/tests/end_to_end/api/test_parse_catalog_e2e.py ================================================ # Copyright 2026 Dell Inc. or its subsidiaries. All Rights Reserved. # # Licensed under the Apache License, Version 2.0 (the "License"); # you may not use this file except in compliance with the License. # You may obtain a copy of the License at # # http://www.apache.org/licenses/LICENSE-2.0 # # Unless required by applicable law or agreed to in writing, software # distributed under the License is distributed on an "AS IS" BASIS, # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. # See the License for the specific language governing permissions and # limitations under the License. """End-to-end tests for Parse Catalog workflow with real authentication. These tests validate the complete parse catalog workflow using real OAuth2 authentication instead of mocks. The tests follow the chronological order: 1. Health check 2. Client registration 3. Token generation 4. Job creation 5. Parse catalog execution 6. Error handling and edge cases Usage: pytest tests/end_to_end/api/test_parse_catalog_e2e.py -v -m e2e Requirements: - ansible-vault must be installed - Tests require write access to create temporary vault files - RSA keys must be available for JWT signing """ import json import os import uuid from typing import Dict, Optional import httpx import pytest class ParseCatalogContext: # pylint: disable=too-many-instance-attributes """Context object to store state across parse catalog tests. This class maintains state between test steps, allowing tests to share data like client credentials, access tokens, and job IDs. Attributes: client_id: Registered client identifier. client_secret: Registered client secret. access_token: Generated JWT access token. job_id: Created job ID for parse catalog testing. catalog_content: Valid catalog content for testing. """ def __init__(self): """Initialize empty context.""" self.client_id: Optional[str] = None self.client_secret: Optional[str] = None self.client_name: Optional[str] = None self.allowed_scopes: Optional[list] = None self.access_token: Optional[str] = None self.token_type: Optional[str] = None self.expires_in: Optional[int] = None self.scope: Optional[str] = None self.job_id: Optional[str] = None self.catalog_content: Optional[bytes] = None def has_client_credentials(self) -> bool: """Check if client credentials are available.""" return self.client_id is not None and self.client_secret is not None def has_access_token(self) -> bool: """Check if access token is available.""" return self.access_token is not None def has_job_id(self) -> bool: """Check if job ID is available.""" return self.job_id is not None def get_auth_header(self) -> Dict[str, str]: """Get Authorization header with Bearer token. Returns: Dictionary with Authorization header. Raises: ValueError: If access token is not available. 
""" if not self.has_access_token(): raise ValueError("Access token not available") return {"Authorization": f"Bearer {self.access_token}"} def set_job_id(self, job_id: str) -> None: """Set the job ID for testing.""" self.job_id = job_id def load_catalog_content(self) -> None: """Load valid catalog content from fixtures.""" here = os.path.dirname(__file__) # Go up from end_to_end/api/ to tests/ then to fixtures/ fixtures_dir = os.path.dirname(os.path.dirname(here)) catalog_path = os.path.join(fixtures_dir, "fixtures", "catalogs", "catalog_rhel.json") with open(catalog_path, 'r', encoding='utf-8') as f: catalog_data = json.load(f) self.catalog_content = json.dumps(catalog_data, indent=2).encode('utf-8') @pytest.fixture(scope="class") def parse_catalog_context(): """Create a shared context for parse catalog tests. Returns: ParseCatalogContext instance shared across test class. """ return ParseCatalogContext() @pytest.mark.e2e @pytest.mark.integration class TestParseCatalogWorkflow: """End-to-end test suite for parse catalog workflow. Tests are ordered to follow the natural workflow: 1. Health check - Verify server is running 2. Client registration - Register OAuth client with catalog scopes 3. Token generation - Obtain JWT access token 4. Job creation - Create a job for parse catalog 5. Parse catalog execution - Execute parse catalog stage 6. Error handling - Test various failure scenarios Each test builds on the previous, storing state in the shared context. """ def test_01_health_check( self, base_url: str, reset_vault, # noqa: W0613 pylint: disable=unused-argument ): """Step 1: Verify server health endpoint is accessible. This confirms the server is running and ready to accept requests. """ with httpx.Client(base_url=base_url, timeout=30.0) as client: response = client.get("/health") assert response.status_code == 200, f"Health check failed: {response.text}" data = response.json() assert data["status"] == "healthy" def test_02_register_client_for_parse_catalog( self, base_url: str, valid_auth_header: Dict[str, str], parse_catalog_context: ParseCatalogContext, # noqa: W0621 ): """Step 2: Register a new OAuth client for parse catalog access. This creates a client that will be used for subsequent parse catalog requests. Client credentials are stored in the shared context. """ with httpx.Client(base_url=base_url, timeout=30.0) as client: response = client.post( "/api/v1/auth/register", headers=valid_auth_header, json={ "client_name": "parse-catalog-test-client", "description": "Client for parse catalog testing", "allowed_scopes": ["catalog:read", "catalog:write"], }, ) assert response.status_code == 201, f"Registration failed: {response.text}" data = response.json() # Verify response structure assert "client_id" in data assert "client_secret" in data assert data["client_id"].startswith("bld_") assert data["client_secret"].startswith("bld_s_") # Store credentials in context for subsequent tests parse_catalog_context.client_id = data["client_id"] parse_catalog_context.client_secret = data["client_secret"] parse_catalog_context.client_name = data["client_name"] parse_catalog_context.allowed_scopes = data["allowed_scopes"] def test_03_request_token_for_parse_catalog( self, base_url: str, parse_catalog_context: ParseCatalogContext, # noqa: W0621 ): """Step 3: Request access token for parse catalog API. Uses the client credentials from registration to obtain a JWT token. Token is stored in the shared context for subsequent API calls. 
""" assert parse_catalog_context.has_client_credentials(), ( "Client credentials not available. Run test_02_register_client_for_parse_catalog first." ) with httpx.Client(base_url=base_url, timeout=30.0) as client: response = client.post( "/api/v1/auth/token", data={ "grant_type": "client_credentials", "client_id": parse_catalog_context.client_id, "client_secret": parse_catalog_context.client_secret, }, ) assert response.status_code == 200, f"Token request failed: {response.text}" data = response.json() # Verify response structure assert "access_token" in data assert data["token_type"] == "Bearer" assert data["expires_in"] > 0 assert "scope" in data # Verify JWT structure parts = data["access_token"].split(".") assert len(parts) == 3, "Token should be valid JWT format" # Store token in context for subsequent tests parse_catalog_context.access_token = data["access_token"] parse_catalog_context.token_type = data["token_type"] parse_catalog_context.expires_in = data["expires_in"] parse_catalog_context.scope = data["scope"] def test_04_create_job_for_parse_catalog( self, base_url: str, parse_catalog_context: ParseCatalogContext, # noqa: W0621 ): """Step 4: Create a new job for parse catalog testing. Tests job creation with proper validation and idempotency. """ assert parse_catalog_context.has_access_token(), ( "Access token not available. Run test_03_request_token_for_parse_catalog first." ) # Prepare job creation request job_data = { "client_id": parse_catalog_context.client_id, "client_name": "Parse Catalog Test Client" } idempotency_key = str(uuid.uuid4()) headers = parse_catalog_context.get_auth_header() headers["Idempotency-Key"] = idempotency_key with httpx.Client(base_url=base_url, timeout=30.0) as client: response = client.post( "/api/v1/jobs", json=job_data, headers=headers, ) assert response.status_code == 201, f"Job creation failed: {response.text}" data = response.json() # Verify response structure assert "job_id" in data assert "job_state" in data assert "created_at" in data assert "correlation_id" in data # Verify job ID format (UUID) uuid.UUID(data["job_id"]) # This will raise ValueError if not valid UUID # Store job ID in context parse_catalog_context.set_job_id(data["job_id"]) # Verify job state assert data["job_state"] == "CREATED" def test_05_parse_catalog_success( self, base_url: str, parse_catalog_context: ParseCatalogContext, # noqa: W0621 ): """Step 5: Execute parse catalog successfully. Tests the complete parse catalog workflow with a valid catalog file. """ assert parse_catalog_context.has_access_token(), ( "Access token not available. Run test_03_request_token_for_parse_catalog first." ) assert parse_catalog_context.has_job_id(), ( "Job ID not available. Run test_04_create_job_for_parse_catalog first." 
) # Load catalog content parse_catalog_context.load_catalog_content() assert parse_catalog_context.catalog_content is not None headers = parse_catalog_context.get_auth_header() with httpx.Client(base_url=base_url, timeout=30.0) as client: response = client.post( f"/api/v1/jobs/{parse_catalog_context.job_id}/stages/parse-catalog", files={ "file": ( "catalog.json", parse_catalog_context.catalog_content, "application/json" ) }, headers=headers, ) # The response should indicate the stage was processed # It might fail due to missing dependencies, but the workflow should be complete assert response.status_code in [200, 400, 422, 500], ( f"Parse catalog failed: {response.text}" ) # Get response data for verification response_data = response.json() if response.status_code == 200 else None # If successful, verify the response structure if response.status_code == 200 and response_data: assert "status" in response_data assert response_data["status"] == "success" assert "message" in response_data def test_06_parse_catalog_with_invalid_data( self, base_url: str, parse_catalog_context: ParseCatalogContext, # noqa: W0621 ): """Step 6: Test parse catalog with invalid catalog data. Tests error handling when invalid catalog data is provided. """ assert parse_catalog_context.has_access_token(), ( "Access token not available. Run test_03_request_token_for_parse_catalog first." ) # Create a new job for this test since the previous job might be in a processed state job_data = { "client_id": parse_catalog_context.client_id, "client_name": "Parse Catalog Test Client" } idempotency_key = str(uuid.uuid4()) headers = parse_catalog_context.get_auth_header() headers["Idempotency-Key"] = idempotency_key with httpx.Client(base_url=base_url, timeout=30.0) as client: job_response = client.post( "/api/v1/jobs", json=job_data, headers=headers, ) assert job_response.status_code == 201 new_job_id = job_response.json()["job_id"] # Create invalid catalog data invalid_catalog = b'{"invalid": "catalog"}' with httpx.Client(base_url=base_url, timeout=30.0) as client: response = client.post( f"/api/v1/jobs/{new_job_id}/stages/parse-catalog", files={"file": ("invalid.json", invalid_catalog, "application/json")}, headers=headers, ) # Should handle the error gracefully assert response.status_code in [400, 422, 500, 409], ( f"Expected error response, got: {response.status_code}" ) def test_07_parse_catalog_with_oversized_file( self, base_url: str, parse_catalog_context: ParseCatalogContext, # noqa: W0621 ): """Step 7: Test parse catalog with oversized file. Tests file upload limits are enforced. """ assert parse_catalog_context.has_access_token(), ( "Access token not available. Run test_03_request_token_for_parse_catalog first." ) assert parse_catalog_context.has_job_id(), ( "Job ID not available. Run test_04_create_job_for_parse_catalog first." 
) # Create a new job for this test since the previous job might be in a failed state job_data = { "client_id": parse_catalog_context.client_id, "client_name": "Parse Catalog Test Client" } idempotency_key = str(uuid.uuid4()) headers = parse_catalog_context.get_auth_header() headers["Idempotency-Key"] = idempotency_key with httpx.Client(base_url=base_url, timeout=30.0) as client: job_response = client.post( "/api/v1/jobs", json=job_data, headers=headers, ) assert job_response.status_code == 201 new_job_id = job_response.json()["job_id"] # Test with an oversized file oversized_content = b'x' * (10 * 1024 * 1024) # 10MB with httpx.Client(base_url=base_url, timeout=30.0) as client: response = client.post( f"/api/v1/jobs/{new_job_id}/stages/parse-catalog", files={"file": ("oversized.json", oversized_content, "application/json")}, headers=headers, ) # Should reject oversized files assert response.status_code in [400, 413, 422], ( f"Expected file size error, got: {response.status_code}" ) def test_08_parse_catalog_job_status_integration( self, base_url: str, parse_catalog_context: ParseCatalogContext, # noqa: W0621 ): """Step 8: Test parse catalog integration with job status. Tests that parse catalog properly updates job status and state. """ assert parse_catalog_context.has_access_token(), ( "Access token not available. Run test_03_request_token_for_parse_catalog first." ) assert parse_catalog_context.has_job_id(), ( "Job ID not available. Run test_04_create_job_for_parse_catalog first." ) headers = parse_catalog_context.get_auth_header() # Check job status with httpx.Client(base_url=base_url, timeout=30.0) as client: response = client.get( f"/api/v1/jobs/{parse_catalog_context.job_id}", headers=headers, ) # Job status should be accessible assert response.status_code in [200, 404], ( f"Job status check failed: {response.status_code}" ) if response.status_code == 200: job_data = response.json() assert "job_state" in job_data assert "created_at" in job_data def test_09_parse_catalog_with_nonexistent_job_fails( self, base_url: str, parse_catalog_context: ParseCatalogContext, # noqa: W0621 ): """Step 9: Test parse catalog with nonexistent job fails. Tests error handling when trying to parse catalog for a job that doesn't exist. """ assert parse_catalog_context.has_access_token(), ( "Access token not available. Run test_03_request_token_for_parse_catalog first." ) headers = parse_catalog_context.get_auth_header() nonexistent_job_id = str(uuid.uuid4()) catalog_content = b'{"test": "catalog"}' with httpx.Client(base_url=base_url, timeout=30.0) as client: response = client.post( f"/api/v1/jobs/{nonexistent_job_id}/stages/parse-catalog", files={"file": ("catalog.json", catalog_content, "application/json")}, headers=headers, ) assert response.status_code == 404, f"Expected 404, got: {response.status_code}" def test_10_parse_catalog_with_oversized_file_security_check( self, base_url: str, parse_catalog_context: ParseCatalogContext, # noqa: W0621 ): """Step 10: Test parse catalog security with oversized file. Tests file upload limits are enforced for security. """ assert parse_catalog_context.has_access_token(), ( "Access token not available. Run test_03_request_token_for_parse_catalog first." 
) # Create a new job for this test job_data = { "client_id": parse_catalog_context.client_id, "client_name": "Parse Catalog Security Test Client" } idempotency_key = str(uuid.uuid4()) headers = parse_catalog_context.get_auth_header() headers["Idempotency-Key"] = idempotency_key with httpx.Client(base_url=base_url, timeout=30.0) as client: job_response = client.post( "/api/v1/jobs", json=job_data, headers=headers, ) assert job_response.status_code == 201 new_job_id = job_response.json()["job_id"] # Test with an oversized file (security check) oversized_content = b'x' * (10 * 1024 * 1024) # 10MB with httpx.Client(base_url=base_url, timeout=30.0) as client: response = client.post( f"/api/v1/jobs/{new_job_id}/stages/parse-catalog", files={"file": ("oversized.json", oversized_content, "application/json")}, headers=headers, ) # Should reject oversized files for security assert response.status_code in [400, 413, 422], ( f"Expected file size error, got: {response.status_code}" ) @pytest.mark.e2e @pytest.mark.integration class TestParseCatalogErrorHandling: """Error handling tests for parse catalog API. These tests ensure the parse catalog API handles errors gracefully and does not expose sensitive information in error responses. """ def test_parse_catalog_without_authentication_fails( self, base_url: str, reset_vault, # noqa: W0613 pylint: disable=unused-argument ): """Verify parse catalog without authentication fails.""" job_id = str(uuid.uuid4()) catalog_content = b'{"test": "catalog"}' with httpx.Client(base_url=base_url, timeout=30.0) as client: response = client.post( f"/api/v1/jobs/{job_id}/stages/parse-catalog", files={ "file": ("catalog.json", catalog_content, "application/json") }, ) # Should fail with either 401 (auth) or 422 (validation before auth) assert response.status_code in [401, 422], ( f"Expected 401 or 422, got: {response.status_code}" ) def test_parse_catalog_with_invalid_token_fails( self, base_url: str, reset_vault, # noqa: W0613 pylint: disable=unused-argument ): """Verify parse catalog with invalid token fails.""" headers = {"Authorization": "Bearer invalid_token"} job_id = str(uuid.uuid4()) catalog_content = b'{"test": "catalog"}' with httpx.Client(base_url=base_url, timeout=30.0) as client: response = client.post( f"/api/v1/jobs/{job_id}/stages/parse-catalog", files={"file": ("catalog.json", catalog_content, "application/json")}, headers=headers, ) assert response.status_code == 401, ( f"Expected 401, got: {response.status_code}" ) @pytest.mark.e2e @pytest.mark.integration @pytest.mark.skip( reason=( "Security validation tests have vault setup conflicts - " "skipping to focus on core functionality" ) ) class TestParseCatalogSecurityValidation: """Security validation tests for parse catalog API. These tests verify that security measures are properly enforced: - Input validation and sanitization - File type validation - Path traversal prevention NOTE: This class is skipped due to vault setup conflicts in independent test execution. Core security validation is covered in the main workflow tests. 
""" def test_parse_catalog_with_malicious_content( self, base_url: str, reset_vault, # noqa: W0613 pylint: disable=unused-argument ): """Verify parse catalog handles malicious content safely.""" pytest.skip() # Use unique client name to avoid conflicts unique_client_id = str(uuid.uuid4())[:8] client_name = f"malicious-content-test-{unique_client_id}" # Register client and get token first with httpx.Client(base_url=base_url, timeout=30.0) as client: # Register client reg_response = client.post( "/api/v1/auth/register", headers={"Authorization": "Basic dGVzdDp0ZXN0"}, # test:test json={ "client_name": client_name, "allowed_scopes": ["catalog:write"], }, ) assert reg_response.status_code == 201 creds = reg_response.json() # Get token token_response = client.post( "/api/v1/auth/token", data={ "grant_type": "client_credentials", "client_id": creds["client_id"], "client_secret": creds["client_secret"], }, ) assert token_response.status_code == 200 token_data = token_response.json() # Create a job job_response = client.post( "/api/v1/jobs", json={ "client_id": creds["client_id"], "client_name": client_name }, headers={ "Authorization": f"Bearer {token_data['access_token']}", "Idempotency-Key": str(uuid.uuid4()) }, ) assert job_response.status_code == 201 job_id = job_response.json()["job_id"] headers = {"Authorization": f"Bearer {token_data['access_token']}"} # Test with malicious content malicious_content = b'{"Catalog": {"Name": ""}}' with httpx.Client(base_url=base_url, timeout=30.0) as client: response = client.post( f"/api/v1/jobs/{job_id}/stages/parse-catalog", files={"file": ("malicious.json", malicious_content, "application/json")}, headers=headers, ) # Should handle malicious content safely assert response.status_code in [400, 422, 500], ( f"Expected error for malicious content, got: {response.status_code}" ) # Response should not contain the malicious content if response.status_code in [400, 422]: response_text = response.text.lower() assert "